ben81828 commited on
Commit
2eb3756
·
verified ·
1 Parent(s): 2624e20

Training in progress, step 2400, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e895c1cddd40eb0dbe387456240309b06d66fe014fd793905368c3b37bbbff4a
3
  size 29034840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:724b21694b2108c1eedcec3aba788b5559aed494f8af9352c85fe7551b55f69c
3
  size 29034840
last-checkpoint/global_step2400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d6f8ac48914dc4e7a50fa8cbfe71666cbf805142b9aec062a3a058e0e40e6b4
3
+ size 43429616
last-checkpoint/global_step2400/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8447d79e1990e976bf439b347c7e02eaec26da92a21ead32bee85b8426c2fbe
3
+ size 43429616
last-checkpoint/global_step2400/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bce02bc6a8b1239b3d666121512b78ca7e2cf74a6eb51c2ee283f4bd9c6afcaa
3
+ size 43429616
last-checkpoint/global_step2400/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf5efa42fc216ceaf721bcd6bd557cebcfb1be06ad53cfcae73b2caa1ecea8aa
3
+ size 43429616
last-checkpoint/global_step2400/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb28cb80645e4e5b08d929feb6cb284b80b9374d0abb5cac7a034e04e045bf67
3
+ size 637299
last-checkpoint/global_step2400/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e18a2b0b8ad83bd9cd5698849f6aafc46f23435824e7200c2e85a9eb4e492a1
3
+ size 637171
last-checkpoint/global_step2400/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc63c2624e3a26f46cb4e76250e1daf40e4de23f6d0694e319d1c3d09e6246cc
3
+ size 637171
last-checkpoint/global_step2400/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9469a2da3dcd4ac7538c85ff2efc3e7edb38b7bb9ddacc4ebbcca32aabfa5fe
3
+ size 637171
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step2350
 
1
+ global_step2400
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f12bf3da75454e5aae4644f2a1d46fdf90f68e680dbf5bdaa86861f825d32d80
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:681faefe4cf303ca7f9bc3073b09b166da4f558d55bee3d5eee90ba5d83159bb
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2faef1b8798e7516fd96ee7b3363866a8f97ca2d0ec5a8dd27bbfe70b0c6a733
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0fb250f1d137fb55cef85743a342508178b4fe3a20c6793c82e279730ea280b
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f35f6d27fbd414dd4285d91816b37fb6b97ff10fbba4c074d56ad2a7f723033
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34a0d7cfaa34f7e3738b4ef4989d693ed7864fed3b2a44ef1b6892fdcf026bb9
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea5c64dfc7e3b2729065483dfef8e4bb0af0d9bae32df888d258ee3c2859d676
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a82aabe23bc62e289ef7d075c79f353bbc81286ec0f8964eabda4209d630e10
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8d0442374b2f8618569ef196bfe7955aa6b552a4eb29da5972e99b6fb6a7877
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9534ff0afb419b8df69ec6dd9eaf407a5fa510c1fc235b2fb5d794e6ea2faecd
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.1869634985923767,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
4
- "epoch": 0.6942392909896603,
5
  "eval_steps": 50,
6
- "global_step": 2350,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4190,11 +4190,100 @@
4190
  "eval_steps_per_second": 0.769,
4191
  "num_input_tokens_seen": 24401256,
4192
  "step": 2350
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4193
  }
4194
  ],
4195
  "logging_steps": 5,
4196
  "max_steps": 6770,
4197
- "num_input_tokens_seen": 24401256,
4198
  "num_train_epochs": 2,
4199
  "save_steps": 50,
4200
  "stateful_callbacks": {
@@ -4209,7 +4298,7 @@
4209
  "attributes": {}
4210
  }
4211
  },
4212
- "total_flos": 1609869937344512.0,
4213
  "train_batch_size": 1,
4214
  "trial_name": null,
4215
  "trial_params": null
 
1
  {
2
  "best_metric": 0.1869634985923767,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
4
+ "epoch": 0.7090103397341211,
5
  "eval_steps": 50,
6
+ "global_step": 2400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4190
  "eval_steps_per_second": 0.769,
4191
  "num_input_tokens_seen": 24401256,
4192
  "step": 2350
4193
+ },
4194
+ {
4195
+ "epoch": 0.6957163958641064,
4196
+ "grad_norm": 1.2627287884293426,
4197
+ "learning_rate": 7.765017944892514e-05,
4198
+ "loss": 0.2499,
4199
+ "num_input_tokens_seen": 24453384,
4200
+ "step": 2355
4201
+ },
4202
+ {
4203
+ "epoch": 0.6971935007385525,
4204
+ "grad_norm": 1.476393664852338,
4205
+ "learning_rate": 7.754834350812765e-05,
4206
+ "loss": 0.2132,
4207
+ "num_input_tokens_seen": 24505960,
4208
+ "step": 2360
4209
+ },
4210
+ {
4211
+ "epoch": 0.6986706056129985,
4212
+ "grad_norm": 3.9395522365245226,
4213
+ "learning_rate": 7.744634321418906e-05,
4214
+ "loss": 0.2049,
4215
+ "num_input_tokens_seen": 24559008,
4216
+ "step": 2365
4217
+ },
4218
+ {
4219
+ "epoch": 0.7001477104874446,
4220
+ "grad_norm": 2.1895254551218115,
4221
+ "learning_rate": 7.734417917564211e-05,
4222
+ "loss": 0.2222,
4223
+ "num_input_tokens_seen": 24611128,
4224
+ "step": 2370
4225
+ },
4226
+ {
4227
+ "epoch": 0.7016248153618907,
4228
+ "grad_norm": 2.3733905521598353,
4229
+ "learning_rate": 7.724185200199643e-05,
4230
+ "loss": 0.2678,
4231
+ "num_input_tokens_seen": 24662336,
4232
+ "step": 2375
4233
+ },
4234
+ {
4235
+ "epoch": 0.7031019202363368,
4236
+ "grad_norm": 6.930201726148201,
4237
+ "learning_rate": 7.713936230373491e-05,
4238
+ "loss": 0.2888,
4239
+ "num_input_tokens_seen": 24714032,
4240
+ "step": 2380
4241
+ },
4242
+ {
4243
+ "epoch": 0.7045790251107829,
4244
+ "grad_norm": 1.2305357870388025,
4245
+ "learning_rate": 7.703671069231007e-05,
4246
+ "loss": 0.2609,
4247
+ "num_input_tokens_seen": 24765296,
4248
+ "step": 2385
4249
+ },
4250
+ {
4251
+ "epoch": 0.7060561299852289,
4252
+ "grad_norm": 1.3830979392967684,
4253
+ "learning_rate": 7.693389778014037e-05,
4254
+ "loss": 0.2654,
4255
+ "num_input_tokens_seen": 24816744,
4256
+ "step": 2390
4257
+ },
4258
+ {
4259
+ "epoch": 0.707533234859675,
4260
+ "grad_norm": 1.641476112098168,
4261
+ "learning_rate": 7.683092418060664e-05,
4262
+ "loss": 0.2231,
4263
+ "num_input_tokens_seen": 24869320,
4264
+ "step": 2395
4265
+ },
4266
+ {
4267
+ "epoch": 0.7090103397341211,
4268
+ "grad_norm": 9.651892844655563,
4269
+ "learning_rate": 7.672779050804834e-05,
4270
+ "loss": 0.262,
4271
+ "num_input_tokens_seen": 24921872,
4272
+ "step": 2400
4273
+ },
4274
+ {
4275
+ "epoch": 0.7090103397341211,
4276
+ "eval_loss": 0.34713664650917053,
4277
+ "eval_runtime": 18.9635,
4278
+ "eval_samples_per_second": 3.164,
4279
+ "eval_steps_per_second": 0.791,
4280
+ "num_input_tokens_seen": 24921872,
4281
+ "step": 2400
4282
  }
4283
  ],
4284
  "logging_steps": 5,
4285
  "max_steps": 6770,
4286
+ "num_input_tokens_seen": 24921872,
4287
  "num_train_epochs": 2,
4288
  "save_steps": 50,
4289
  "stateful_callbacks": {
 
4298
  "attributes": {}
4299
  }
4300
  },
4301
+ "total_flos": 1644216510578688.0,
4302
  "train_batch_size": 1,
4303
  "trial_name": null,
4304
  "trial_params": null