Training in progress, step 2350, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step2350/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step2350/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step2350/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step2350/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step2350/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step2350/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step2350/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step2350/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +95 -6
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e895c1cddd40eb0dbe387456240309b06d66fe014fd793905368c3b37bbbff4a
|
3 |
size 29034840
|
last-checkpoint/global_step2350/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e64eef91b1c41414b86c1c79785e71b08863e11060ff8cc3ef7864e7ebdfd9ea
|
3 |
+
size 43429616
|
last-checkpoint/global_step2350/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e5375885f162d12b5216a73c6bb52338439850ad1e62fb1c7c0c1edab8bc406
|
3 |
+
size 43429616
|
last-checkpoint/global_step2350/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9591fd0143ecbd5381bf4045248702d04a33777473a65e109ac0ff4e0b72032
|
3 |
+
size 43429616
|
last-checkpoint/global_step2350/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f2bea725eb09303fe4967379db3c2f97314752353eb0873dd28f22e85954261
|
3 |
+
size 43429616
|
last-checkpoint/global_step2350/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77ea2f1422947988eee2012dbb023c20b562004f04b0280a6b2e02eb0104df6c
|
3 |
+
size 637299
|
last-checkpoint/global_step2350/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d2de4b133830a36a27f5675bcfb3196e62844d0ea6515c1da4410138b5a0d55
|
3 |
+
size 637171
|
last-checkpoint/global_step2350/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efb4f0a348ba8ed1a0f899c6bd11b00341b3cb75bef3c71ead62d8cdd2a38d6d
|
3 |
+
size 637171
|
last-checkpoint/global_step2350/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddee7cdbd3744f566b1d3de4032edc8a6be338074790be0b4e6dd344c41978e2
|
3 |
+
size 637171
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step2350
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f12bf3da75454e5aae4644f2a1d46fdf90f68e680dbf5bdaa86861f825d32d80
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2faef1b8798e7516fd96ee7b3363866a8f97ca2d0ec5a8dd27bbfe70b0c6a733
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f35f6d27fbd414dd4285d91816b37fb6b97ff10fbba4c074d56ad2a7f723033
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea5c64dfc7e3b2729065483dfef8e4bb0af0d9bae32df888d258ee3c2859d676
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8d0442374b2f8618569ef196bfe7955aa6b552a4eb29da5972e99b6fb6a7877
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -4101,11 +4101,100 @@
|
|
4101 |
"eval_steps_per_second": 0.791,
|
4102 |
"num_input_tokens_seen": 23883032,
|
4103 |
"step": 2300
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4104 |
}
|
4105 |
],
|
4106 |
"logging_steps": 5,
|
4107 |
"max_steps": 6770,
|
4108 |
-
"num_input_tokens_seen":
|
4109 |
"num_train_epochs": 2,
|
4110 |
"save_steps": 50,
|
4111 |
"stateful_callbacks": {
|
@@ -4120,7 +4209,7 @@
|
|
4120 |
"attributes": {}
|
4121 |
}
|
4122 |
},
|
4123 |
-
"total_flos":
|
4124 |
"train_batch_size": 1,
|
4125 |
"trial_name": null,
|
4126 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.1869634985923767,
|
3 |
+
"best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
|
4 |
+
"epoch": 0.6942392909896603,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 2350,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
4101 |
"eval_steps_per_second": 0.791,
|
4102 |
"num_input_tokens_seen": 23883032,
|
4103 |
"step": 2300
|
4104 |
+
},
|
4105 |
+
{
|
4106 |
+
"epoch": 0.6809453471196455,
|
4107 |
+
"grad_norm": 15.468575933907964,
|
4108 |
+
"learning_rate": 7.865936626267243e-05,
|
4109 |
+
"loss": 0.2474,
|
4110 |
+
"num_input_tokens_seen": 23934880,
|
4111 |
+
"step": 2305
|
4112 |
+
},
|
4113 |
+
{
|
4114 |
+
"epoch": 0.6824224519940916,
|
4115 |
+
"grad_norm": 3.9259269918244932,
|
4116 |
+
"learning_rate": 7.855920710508009e-05,
|
4117 |
+
"loss": 0.2613,
|
4118 |
+
"num_input_tokens_seen": 23986160,
|
4119 |
+
"step": 2310
|
4120 |
+
},
|
4121 |
+
{
|
4122 |
+
"epoch": 0.6838995568685377,
|
4123 |
+
"grad_norm": 1.443222642921112,
|
4124 |
+
"learning_rate": 7.845887756354458e-05,
|
4125 |
+
"loss": 0.1957,
|
4126 |
+
"num_input_tokens_seen": 24038984,
|
4127 |
+
"step": 2315
|
4128 |
+
},
|
4129 |
+
{
|
4130 |
+
"epoch": 0.6853766617429837,
|
4131 |
+
"grad_norm": 2.418773014069429,
|
4132 |
+
"learning_rate": 7.835837823663092e-05,
|
4133 |
+
"loss": 0.2709,
|
4134 |
+
"num_input_tokens_seen": 24090648,
|
4135 |
+
"step": 2320
|
4136 |
+
},
|
4137 |
+
{
|
4138 |
+
"epoch": 0.6868537666174298,
|
4139 |
+
"grad_norm": 1.2678547091245644,
|
4140 |
+
"learning_rate": 7.825770972391712e-05,
|
4141 |
+
"loss": 0.2873,
|
4142 |
+
"num_input_tokens_seen": 24142200,
|
4143 |
+
"step": 2325
|
4144 |
+
},
|
4145 |
+
{
|
4146 |
+
"epoch": 0.6883308714918759,
|
4147 |
+
"grad_norm": 1.5899740505737827,
|
4148 |
+
"learning_rate": 7.81568726259905e-05,
|
4149 |
+
"loss": 0.2378,
|
4150 |
+
"num_input_tokens_seen": 24194400,
|
4151 |
+
"step": 2330
|
4152 |
+
},
|
4153 |
+
{
|
4154 |
+
"epoch": 0.689807976366322,
|
4155 |
+
"grad_norm": 1.6209911075093861,
|
4156 |
+
"learning_rate": 7.805586754444416e-05,
|
4157 |
+
"loss": 0.2615,
|
4158 |
+
"num_input_tokens_seen": 24245328,
|
4159 |
+
"step": 2335
|
4160 |
+
},
|
4161 |
+
{
|
4162 |
+
"epoch": 0.691285081240768,
|
4163 |
+
"grad_norm": 16.06254938606901,
|
4164 |
+
"learning_rate": 7.795469508187343e-05,
|
4165 |
+
"loss": 0.2234,
|
4166 |
+
"num_input_tokens_seen": 24297400,
|
4167 |
+
"step": 2340
|
4168 |
+
},
|
4169 |
+
{
|
4170 |
+
"epoch": 0.6927621861152142,
|
4171 |
+
"grad_norm": 2.2353075576651085,
|
4172 |
+
"learning_rate": 7.785335584187219e-05,
|
4173 |
+
"loss": 0.2833,
|
4174 |
+
"num_input_tokens_seen": 24348536,
|
4175 |
+
"step": 2345
|
4176 |
+
},
|
4177 |
+
{
|
4178 |
+
"epoch": 0.6942392909896603,
|
4179 |
+
"grad_norm": 11.321777956495533,
|
4180 |
+
"learning_rate": 7.775185042902933e-05,
|
4181 |
+
"loss": 0.2313,
|
4182 |
+
"num_input_tokens_seen": 24401256,
|
4183 |
+
"step": 2350
|
4184 |
+
},
|
4185 |
+
{
|
4186 |
+
"epoch": 0.6942392909896603,
|
4187 |
+
"eval_loss": 0.1869634985923767,
|
4188 |
+
"eval_runtime": 19.499,
|
4189 |
+
"eval_samples_per_second": 3.077,
|
4190 |
+
"eval_steps_per_second": 0.769,
|
4191 |
+
"num_input_tokens_seen": 24401256,
|
4192 |
+
"step": 2350
|
4193 |
}
|
4194 |
],
|
4195 |
"logging_steps": 5,
|
4196 |
"max_steps": 6770,
|
4197 |
+
"num_input_tokens_seen": 24401256,
|
4198 |
"num_train_epochs": 2,
|
4199 |
"save_steps": 50,
|
4200 |
"stateful_callbacks": {
|
|
|
4209 |
"attributes": {}
|
4210 |
}
|
4211 |
},
|
4212 |
+
"total_flos": 1609869937344512.0,
|
4213 |
"train_batch_size": 1,
|
4214 |
"trial_name": null,
|
4215 |
"trial_params": null
|