ben81828 committed on
Commit
2313c0c
·
verified ·
1 Parent(s): 70d10ac

Training in progress, step 2550, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51ba4cb036f96637ea50997962c817be8981b7c185736e25bcaea373e2187935
3
  size 29034840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1423743ef577d043d7175f7e7d833ad5439113f93d35aae3b6833a3cf0e1cb32
3
  size 29034840
last-checkpoint/global_step2550/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f29a88ea5d9b70f23bfc7d8df4834f8ec9eb3984889b6eb41c4fc4e0dfe55520
3
+ size 43429616
last-checkpoint/global_step2550/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38359757b3fbb8e96e3ff3913f5d0aa896569c07d080dd28fdfb26ae27ac5c3c
3
+ size 43429616
last-checkpoint/global_step2550/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6aa6a53eda7f26bba15fd86b7065e2ec7fab955a6a5a2721e0b2618778f45fe0
3
+ size 43429616
last-checkpoint/global_step2550/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2004ed1d03646db619ab4a937a8568de4e2b1a108c0f28378de10e0a8693edf8
3
+ size 43429616
last-checkpoint/global_step2550/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:459c71b1156c55fcd73acb65442792d22282e3260b89f66cdf8ad0815d56f457
3
+ size 637299
last-checkpoint/global_step2550/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c42effbfd8441de135408f95c55462d6c1c4c8dd96b6417b67de471d2e95afcb
3
+ size 637171
last-checkpoint/global_step2550/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:304c5ba32c89fec95d937699d77819f8e533af674d93476e22a507dac625cebf
3
+ size 637171
last-checkpoint/global_step2550/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcaea5da1d1730a97458c88513e37f66edcf7420f14ca71eb82cab77a1de4424
3
+ size 637171
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step2500
 
1
+ global_step2550
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a97c73c15a2a5b2de7dc426a700b2053aee43809425431c513cc5e3aab6c2107
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0362dfd92e8da01e4a0deedcbd1c493b8162d5d1d84d5a4c1cd210c556f2cf9b
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1296b339c1b16ab7e14352a269004d20ede428aef748283fb0a6650d62f58129
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e65c5adee1a22c5343e38495a6905880496fb22d5e3ec5b16b87aadb731969d2
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:000b1637f5e73170f2337500a6a083df3a43d967d642b6c3a68f60deb6c3b960
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8d8858483b0c6944d55621cc2633469e3e0d04c48b6671eee92d4abab2352c2
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8bcb6e7802f6d888bc099642911087298cfb1adf7053a2d43a67192a53404ef
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca42ef4f7a2f8c2285c4cf6cef585dcc0b132b21e8bb33d96d53b6db837f5e54
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be10edf7c6be9f43df78beaad8c1006d912dae1be4452d19b94e400653092195
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67937b6f5a5203cd96f4ea9c985d72d16ed7c92555e94021ae353606f325a9ea
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.1869634985923767,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
4
- "epoch": 0.7385524372230429,
5
  "eval_steps": 50,
6
- "global_step": 2500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4457,11 +4457,100 @@
4457
  "eval_steps_per_second": 0.784,
4458
  "num_input_tokens_seen": 25961056,
4459
  "step": 2500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4460
  }
4461
  ],
4462
  "logging_steps": 5,
4463
  "max_steps": 6770,
4464
- "num_input_tokens_seen": 25961056,
4465
  "num_train_epochs": 2,
4466
  "save_steps": 50,
4467
  "stateful_callbacks": {
@@ -4476,7 +4565,7 @@
4476
  "attributes": {}
4477
  }
4478
  },
4479
- "total_flos": 1712735614402560.0,
4480
  "train_batch_size": 1,
4481
  "trial_name": null,
4482
  "trial_params": null
 
1
  {
2
  "best_metric": 0.1869634985923767,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
4
+ "epoch": 0.7533234859675036,
5
  "eval_steps": 50,
6
+ "global_step": 2550,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4457
  "eval_steps_per_second": 0.784,
4458
  "num_input_tokens_seen": 25961056,
4459
  "step": 2500
4460
+ },
4461
+ {
4462
+ "epoch": 0.740029542097489,
4463
+ "grad_norm": 3.4127573468108934,
4464
+ "learning_rate": 7.452610450181865e-05,
4465
+ "loss": 0.2843,
4466
+ "num_input_tokens_seen": 26012232,
4467
+ "step": 2505
4468
+ },
4469
+ {
4470
+ "epoch": 0.741506646971935,
4471
+ "grad_norm": 1.8065383217954118,
4472
+ "learning_rate": 7.441960654426687e-05,
4473
+ "loss": 0.2376,
4474
+ "num_input_tokens_seen": 26064432,
4475
+ "step": 2510
4476
+ },
4477
+ {
4478
+ "epoch": 0.7429837518463811,
4479
+ "grad_norm": 1.038286812818806,
4480
+ "learning_rate": 7.431296289958735e-05,
4481
+ "loss": 0.2464,
4482
+ "num_input_tokens_seen": 26115856,
4483
+ "step": 2515
4484
+ },
4485
+ {
4486
+ "epoch": 0.7444608567208272,
4487
+ "grad_norm": 1.3908978510260759,
4488
+ "learning_rate": 7.4206174204015e-05,
4489
+ "loss": 0.2793,
4490
+ "num_input_tokens_seen": 26167176,
4491
+ "step": 2520
4492
+ },
4493
+ {
4494
+ "epoch": 0.7459379615952733,
4495
+ "grad_norm": 1.785011959334391,
4496
+ "learning_rate": 7.409924109465011e-05,
4497
+ "loss": 0.2141,
4498
+ "num_input_tokens_seen": 26219144,
4499
+ "step": 2525
4500
+ },
4501
+ {
4502
+ "epoch": 0.7474150664697193,
4503
+ "grad_norm": 1.0393762543520273,
4504
+ "learning_rate": 7.399216420945453e-05,
4505
+ "loss": 0.2137,
4506
+ "num_input_tokens_seen": 26271712,
4507
+ "step": 2530
4508
+ },
4509
+ {
4510
+ "epoch": 0.7488921713441654,
4511
+ "grad_norm": 5.12895726872253,
4512
+ "learning_rate": 7.388494418724789e-05,
4513
+ "loss": 0.2177,
4514
+ "num_input_tokens_seen": 26323656,
4515
+ "step": 2535
4516
+ },
4517
+ {
4518
+ "epoch": 0.7503692762186115,
4519
+ "grad_norm": 9.06455667620907,
4520
+ "learning_rate": 7.377758166770377e-05,
4521
+ "loss": 0.2762,
4522
+ "num_input_tokens_seen": 26375392,
4523
+ "step": 2540
4524
+ },
4525
+ {
4526
+ "epoch": 0.7518463810930576,
4527
+ "grad_norm": 1.4100384205361678,
4528
+ "learning_rate": 7.367007729134588e-05,
4529
+ "loss": 0.2794,
4530
+ "num_input_tokens_seen": 26426080,
4531
+ "step": 2545
4532
+ },
4533
+ {
4534
+ "epoch": 0.7533234859675036,
4535
+ "grad_norm": 0.9925649690798728,
4536
+ "learning_rate": 7.356243169954426e-05,
4537
+ "loss": 0.2364,
4538
+ "num_input_tokens_seen": 26477208,
4539
+ "step": 2550
4540
+ },
4541
+ {
4542
+ "epoch": 0.7533234859675036,
4543
+ "eval_loss": 0.38712552189826965,
4544
+ "eval_runtime": 19.0707,
4545
+ "eval_samples_per_second": 3.146,
4546
+ "eval_steps_per_second": 0.787,
4547
+ "num_input_tokens_seen": 26477208,
4548
+ "step": 2550
4549
  }
4550
  ],
4551
  "logging_steps": 5,
4552
  "max_steps": 6770,
4553
+ "num_input_tokens_seen": 26477208,
4554
  "num_train_epochs": 2,
4555
  "save_steps": 50,
4556
  "stateful_callbacks": {
 
4565
  "attributes": {}
4566
  }
4567
  },
4568
+ "total_flos": 1746750507581440.0,
4569
  "train_batch_size": 1,
4570
  "trial_name": null,
4571
  "trial_params": null