Training in progress, step 2400, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step2400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step2400/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step2400/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step2400/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step2400/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step2400/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step2400/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step2400/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +93 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:724b21694b2108c1eedcec3aba788b5559aed494f8af9352c85fe7551b55f69c
|
3 |
size 29034840
|
last-checkpoint/global_step2400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d6f8ac48914dc4e7a50fa8cbfe71666cbf805142b9aec062a3a058e0e40e6b4
|
3 |
+
size 43429616
|
last-checkpoint/global_step2400/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8447d79e1990e976bf439b347c7e02eaec26da92a21ead32bee85b8426c2fbe
|
3 |
+
size 43429616
|
last-checkpoint/global_step2400/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bce02bc6a8b1239b3d666121512b78ca7e2cf74a6eb51c2ee283f4bd9c6afcaa
|
3 |
+
size 43429616
|
last-checkpoint/global_step2400/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf5efa42fc216ceaf721bcd6bd557cebcfb1be06ad53cfcae73b2caa1ecea8aa
|
3 |
+
size 43429616
|
last-checkpoint/global_step2400/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb28cb80645e4e5b08d929feb6cb284b80b9374d0abb5cac7a034e04e045bf67
|
3 |
+
size 637299
|
last-checkpoint/global_step2400/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e18a2b0b8ad83bd9cd5698849f6aafc46f23435824e7200c2e85a9eb4e492a1
|
3 |
+
size 637171
|
last-checkpoint/global_step2400/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc63c2624e3a26f46cb4e76250e1daf40e4de23f6d0694e319d1c3d09e6246cc
|
3 |
+
size 637171
|
last-checkpoint/global_step2400/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9469a2da3dcd4ac7538c85ff2efc3e7edb38b7bb9ddacc4ebbcca32aabfa5fe
|
3 |
+
size 637171
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step2400
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:681faefe4cf303ca7f9bc3073b09b166da4f558d55bee3d5eee90ba5d83159bb
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0fb250f1d137fb55cef85743a342508178b4fe3a20c6793c82e279730ea280b
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34a0d7cfaa34f7e3738b4ef4989d693ed7864fed3b2a44ef1b6892fdcf026bb9
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a82aabe23bc62e289ef7d075c79f353bbc81286ec0f8964eabda4209d630e10
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9534ff0afb419b8df69ec6dd9eaf407a5fa510c1fc235b2fb5d794e6ea2faecd
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.1869634985923767,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -4190,11 +4190,100 @@
|
|
4190 |
"eval_steps_per_second": 0.769,
|
4191 |
"num_input_tokens_seen": 24401256,
|
4192 |
"step": 2350
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4193 |
}
|
4194 |
],
|
4195 |
"logging_steps": 5,
|
4196 |
"max_steps": 6770,
|
4197 |
-
"num_input_tokens_seen":
|
4198 |
"num_train_epochs": 2,
|
4199 |
"save_steps": 50,
|
4200 |
"stateful_callbacks": {
|
@@ -4209,7 +4298,7 @@
|
|
4209 |
"attributes": {}
|
4210 |
}
|
4211 |
},
|
4212 |
-
"total_flos":
|
4213 |
"train_batch_size": 1,
|
4214 |
"trial_name": null,
|
4215 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.1869634985923767,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
|
4 |
+
"epoch": 0.7090103397341211,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 2400,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
4190 |
"eval_steps_per_second": 0.769,
|
4191 |
"num_input_tokens_seen": 24401256,
|
4192 |
"step": 2350
|
4193 |
+
},
|
4194 |
+
{
|
4195 |
+
"epoch": 0.6957163958641064,
|
4196 |
+
"grad_norm": 1.2627287884293426,
|
4197 |
+
"learning_rate": 7.765017944892514e-05,
|
4198 |
+
"loss": 0.2499,
|
4199 |
+
"num_input_tokens_seen": 24453384,
|
4200 |
+
"step": 2355
|
4201 |
+
},
|
4202 |
+
{
|
4203 |
+
"epoch": 0.6971935007385525,
|
4204 |
+
"grad_norm": 1.476393664852338,
|
4205 |
+
"learning_rate": 7.754834350812765e-05,
|
4206 |
+
"loss": 0.2132,
|
4207 |
+
"num_input_tokens_seen": 24505960,
|
4208 |
+
"step": 2360
|
4209 |
+
},
|
4210 |
+
{
|
4211 |
+
"epoch": 0.6986706056129985,
|
4212 |
+
"grad_norm": 3.9395522365245226,
|
4213 |
+
"learning_rate": 7.744634321418906e-05,
|
4214 |
+
"loss": 0.2049,
|
4215 |
+
"num_input_tokens_seen": 24559008,
|
4216 |
+
"step": 2365
|
4217 |
+
},
|
4218 |
+
{
|
4219 |
+
"epoch": 0.7001477104874446,
|
4220 |
+
"grad_norm": 2.1895254551218115,
|
4221 |
+
"learning_rate": 7.734417917564211e-05,
|
4222 |
+
"loss": 0.2222,
|
4223 |
+
"num_input_tokens_seen": 24611128,
|
4224 |
+
"step": 2370
|
4225 |
+
},
|
4226 |
+
{
|
4227 |
+
"epoch": 0.7016248153618907,
|
4228 |
+
"grad_norm": 2.3733905521598353,
|
4229 |
+
"learning_rate": 7.724185200199643e-05,
|
4230 |
+
"loss": 0.2678,
|
4231 |
+
"num_input_tokens_seen": 24662336,
|
4232 |
+
"step": 2375
|
4233 |
+
},
|
4234 |
+
{
|
4235 |
+
"epoch": 0.7031019202363368,
|
4236 |
+
"grad_norm": 6.930201726148201,
|
4237 |
+
"learning_rate": 7.713936230373491e-05,
|
4238 |
+
"loss": 0.2888,
|
4239 |
+
"num_input_tokens_seen": 24714032,
|
4240 |
+
"step": 2380
|
4241 |
+
},
|
4242 |
+
{
|
4243 |
+
"epoch": 0.7045790251107829,
|
4244 |
+
"grad_norm": 1.2305357870388025,
|
4245 |
+
"learning_rate": 7.703671069231007e-05,
|
4246 |
+
"loss": 0.2609,
|
4247 |
+
"num_input_tokens_seen": 24765296,
|
4248 |
+
"step": 2385
|
4249 |
+
},
|
4250 |
+
{
|
4251 |
+
"epoch": 0.7060561299852289,
|
4252 |
+
"grad_norm": 1.3830979392967684,
|
4253 |
+
"learning_rate": 7.693389778014037e-05,
|
4254 |
+
"loss": 0.2654,
|
4255 |
+
"num_input_tokens_seen": 24816744,
|
4256 |
+
"step": 2390
|
4257 |
+
},
|
4258 |
+
{
|
4259 |
+
"epoch": 0.707533234859675,
|
4260 |
+
"grad_norm": 1.641476112098168,
|
4261 |
+
"learning_rate": 7.683092418060664e-05,
|
4262 |
+
"loss": 0.2231,
|
4263 |
+
"num_input_tokens_seen": 24869320,
|
4264 |
+
"step": 2395
|
4265 |
+
},
|
4266 |
+
{
|
4267 |
+
"epoch": 0.7090103397341211,
|
4268 |
+
"grad_norm": 9.651892844655563,
|
4269 |
+
"learning_rate": 7.672779050804834e-05,
|
4270 |
+
"loss": 0.262,
|
4271 |
+
"num_input_tokens_seen": 24921872,
|
4272 |
+
"step": 2400
|
4273 |
+
},
|
4274 |
+
{
|
4275 |
+
"epoch": 0.7090103397341211,
|
4276 |
+
"eval_loss": 0.34713664650917053,
|
4277 |
+
"eval_runtime": 18.9635,
|
4278 |
+
"eval_samples_per_second": 3.164,
|
4279 |
+
"eval_steps_per_second": 0.791,
|
4280 |
+
"num_input_tokens_seen": 24921872,
|
4281 |
+
"step": 2400
|
4282 |
}
|
4283 |
],
|
4284 |
"logging_steps": 5,
|
4285 |
"max_steps": 6770,
|
4286 |
+
"num_input_tokens_seen": 24921872,
|
4287 |
"num_train_epochs": 2,
|
4288 |
"save_steps": 50,
|
4289 |
"stateful_callbacks": {
|
|
|
4298 |
"attributes": {}
|
4299 |
}
|
4300 |
},
|
4301 |
+
"total_flos": 1644216510578688.0,
|
4302 |
"train_batch_size": 1,
|
4303 |
"trial_name": null,
|
4304 |
"trial_params": null
|