Training in progress, step 3100, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step3100/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step3100/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step3100/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step3100/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step3100/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step3100/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step3100/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step3100/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +93 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e16399a54feade86bfbf61a8556cd130e7f0cb7bcc816ba08b4856dddb7606a
|
3 |
size 29034840
|
last-checkpoint/global_step3100/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6442e5ae9de93ac10a49957a278a8a63d68a76b5e1df84a2a5207fcdfdfe5303
|
3 |
+
size 43429616
|
last-checkpoint/global_step3100/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6148ab1901e304f398bc54c299448042794f7778437012ec25bea1e0a271e0e
|
3 |
+
size 43429616
|
last-checkpoint/global_step3100/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e45c316e0222d4db8f427c991e41ed7b9093eaa68eabafbe2505a1c9e031d0f
|
3 |
+
size 43429616
|
last-checkpoint/global_step3100/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecd92104d8c6c8c164703d77b771b654c64c485a242b292c5c9903c253fface5
|
3 |
+
size 43429616
|
last-checkpoint/global_step3100/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:769a527c4e6f510809f5b2b13928892b9b7024384bc00772661a2cccde5e4fa4
|
3 |
+
size 637299
|
last-checkpoint/global_step3100/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d05589d1f79cab339f6f64907a5dbf1bd44b1e8d65a9a1f019d2ec8e2b3cd2a6
|
3 |
+
size 637171
|
last-checkpoint/global_step3100/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e28ad7a834b66d1ee2fe12359362f2fdb764eaf9b451b44e1d6df40abfd8079c
|
3 |
+
size 637171
|
last-checkpoint/global_step3100/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:226452aea7fb29b0cd6c8e9e340122bb65353ec4a0df00019fe9614dc4195bc6
|
3 |
+
size 637171
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step3100
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:381f090b12cbb3fcce976bd2e72d07a7786154c2848cc881d75715648e7c4dc2
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4321dc1beb6c245d4a16a8fb2bed2ce2a40d89e5a9c611c4572f63a09523846c
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b79020117e301cd96518c9d1e3eb43a609bc85799f14bac63d9c572fc04cb89
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5429623c7323b4a820ea3d76194bc456c2affeeb1f3af8978aec5aee11b2d1ef
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3b3f02f00a06f9630f63af0f9d2eac4db52dcd348e24cd0a92f7c194ed5add6
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.1869634985923767,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -5436,11 +5436,100 @@
|
|
5436 |
"eval_steps_per_second": 0.779,
|
5437 |
"num_input_tokens_seen": 31679080,
|
5438 |
"step": 3050
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5439 |
}
|
5440 |
],
|
5441 |
"logging_steps": 5,
|
5442 |
"max_steps": 6770,
|
5443 |
-
"num_input_tokens_seen":
|
5444 |
"num_train_epochs": 2,
|
5445 |
"save_steps": 50,
|
5446 |
"stateful_callbacks": {
|
@@ -5455,7 +5544,7 @@
|
|
5455 |
"attributes": {}
|
5456 |
}
|
5457 |
},
|
5458 |
-
"total_flos":
|
5459 |
"train_batch_size": 1,
|
5460 |
"trial_name": null,
|
5461 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.1869634985923767,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
|
4 |
+
"epoch": 0.9158050221565731,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 3100,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
5436 |
"eval_steps_per_second": 0.779,
|
5437 |
"num_input_tokens_seen": 31679080,
|
5438 |
"step": 3050
|
5439 |
+
},
|
5440 |
+
{
|
5441 |
+
"epoch": 0.9025110782865583,
|
5442 |
+
"grad_norm": 1.1996422945391199,
|
5443 |
+
"learning_rate": 6.207976753619816e-05,
|
5444 |
+
"loss": 0.1854,
|
5445 |
+
"num_input_tokens_seen": 31731232,
|
5446 |
+
"step": 3055
|
5447 |
+
},
|
5448 |
+
{
|
5449 |
+
"epoch": 0.9039881831610044,
|
5450 |
+
"grad_norm": 1.142249274568305,
|
5451 |
+
"learning_rate": 6.196122246447779e-05,
|
5452 |
+
"loss": 0.1813,
|
5453 |
+
"num_input_tokens_seen": 31783480,
|
5454 |
+
"step": 3060
|
5455 |
+
},
|
5456 |
+
{
|
5457 |
+
"epoch": 0.9054652880354506,
|
5458 |
+
"grad_norm": 1.8891844898246446,
|
5459 |
+
"learning_rate": 6.184260603222416e-05,
|
5460 |
+
"loss": 0.2099,
|
5461 |
+
"num_input_tokens_seen": 31835864,
|
5462 |
+
"step": 3065
|
5463 |
+
},
|
5464 |
+
{
|
5465 |
+
"epoch": 0.9069423929098966,
|
5466 |
+
"grad_norm": 1.1771283819772904,
|
5467 |
+
"learning_rate": 6.17239189471017e-05,
|
5468 |
+
"loss": 0.2158,
|
5469 |
+
"num_input_tokens_seen": 31887120,
|
5470 |
+
"step": 3070
|
5471 |
+
},
|
5472 |
+
{
|
5473 |
+
"epoch": 0.9084194977843427,
|
5474 |
+
"grad_norm": 1.000017408106927,
|
5475 |
+
"learning_rate": 6.160516191719638e-05,
|
5476 |
+
"loss": 0.1947,
|
5477 |
+
"num_input_tokens_seen": 31938768,
|
5478 |
+
"step": 3075
|
5479 |
+
},
|
5480 |
+
{
|
5481 |
+
"epoch": 0.9098966026587888,
|
5482 |
+
"grad_norm": 10.76780458746382,
|
5483 |
+
"learning_rate": 6.148633565101145e-05,
|
5484 |
+
"loss": 0.2058,
|
5485 |
+
"num_input_tokens_seen": 31990800,
|
5486 |
+
"step": 3080
|
5487 |
+
},
|
5488 |
+
{
|
5489 |
+
"epoch": 0.9113737075332349,
|
5490 |
+
"grad_norm": 1.5246138398849078,
|
5491 |
+
"learning_rate": 6.136744085746322e-05,
|
5492 |
+
"loss": 0.2366,
|
5493 |
+
"num_input_tokens_seen": 32042096,
|
5494 |
+
"step": 3085
|
5495 |
+
},
|
5496 |
+
{
|
5497 |
+
"epoch": 0.912850812407681,
|
5498 |
+
"grad_norm": 1.3169793573688027,
|
5499 |
+
"learning_rate": 6.124847824587684e-05,
|
5500 |
+
"loss": 0.2749,
|
5501 |
+
"num_input_tokens_seen": 32092864,
|
5502 |
+
"step": 3090
|
5503 |
+
},
|
5504 |
+
{
|
5505 |
+
"epoch": 0.914327917282127,
|
5506 |
+
"grad_norm": 1.0350686863717118,
|
5507 |
+
"learning_rate": 6.112944852598205e-05,
|
5508 |
+
"loss": 0.2242,
|
5509 |
+
"num_input_tokens_seen": 32144288,
|
5510 |
+
"step": 3095
|
5511 |
+
},
|
5512 |
+
{
|
5513 |
+
"epoch": 0.9158050221565731,
|
5514 |
+
"grad_norm": 0.8553950294390508,
|
5515 |
+
"learning_rate": 6.1010352407908966e-05,
|
5516 |
+
"loss": 0.1999,
|
5517 |
+
"num_input_tokens_seen": 32196176,
|
5518 |
+
"step": 3100
|
5519 |
+
},
|
5520 |
+
{
|
5521 |
+
"epoch": 0.9158050221565731,
|
5522 |
+
"eval_loss": 0.2710443437099457,
|
5523 |
+
"eval_runtime": 19.0309,
|
5524 |
+
"eval_samples_per_second": 3.153,
|
5525 |
+
"eval_steps_per_second": 0.788,
|
5526 |
+
"num_input_tokens_seen": 32196176,
|
5527 |
+
"step": 3100
|
5528 |
}
|
5529 |
],
|
5530 |
"logging_steps": 5,
|
5531 |
"max_steps": 6770,
|
5532 |
+
"num_input_tokens_seen": 32196176,
|
5533 |
"num_train_epochs": 2,
|
5534 |
"save_steps": 50,
|
5535 |
"stateful_callbacks": {
|
|
|
5544 |
"attributes": {}
|
5545 |
}
|
5546 |
},
|
5547 |
+
"total_flos": 2124006796820480.0,
|
5548 |
"train_batch_size": 1,
|
5549 |
"trial_name": null,
|
5550 |
"trial_params": null
|