ben81828 commited on
Commit
11b142a
·
verified ·
1 Parent(s): b639496

Training in progress, step 2350, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee4d20084c020812db6dbd79fbf4828c8db14c421e8619ec1b2d21ffca81b370
3
  size 29034840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e895c1cddd40eb0dbe387456240309b06d66fe014fd793905368c3b37bbbff4a
3
  size 29034840
last-checkpoint/global_step2350/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e64eef91b1c41414b86c1c79785e71b08863e11060ff8cc3ef7864e7ebdfd9ea
3
+ size 43429616
last-checkpoint/global_step2350/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e5375885f162d12b5216a73c6bb52338439850ad1e62fb1c7c0c1edab8bc406
3
+ size 43429616
last-checkpoint/global_step2350/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9591fd0143ecbd5381bf4045248702d04a33777473a65e109ac0ff4e0b72032
3
+ size 43429616
last-checkpoint/global_step2350/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f2bea725eb09303fe4967379db3c2f97314752353eb0873dd28f22e85954261
3
+ size 43429616
last-checkpoint/global_step2350/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77ea2f1422947988eee2012dbb023c20b562004f04b0280a6b2e02eb0104df6c
3
+ size 637299
last-checkpoint/global_step2350/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d2de4b133830a36a27f5675bcfb3196e62844d0ea6515c1da4410138b5a0d55
3
+ size 637171
last-checkpoint/global_step2350/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efb4f0a348ba8ed1a0f899c6bd11b00341b3cb75bef3c71ead62d8cdd2a38d6d
3
+ size 637171
last-checkpoint/global_step2350/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddee7cdbd3744f566b1d3de4032edc8a6be338074790be0b4e6dd344c41978e2
3
+ size 637171
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step2300
 
1
+ global_step2350
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d25cbcbbaa0866ea9c7365cb49b84e805db119693e615f5a1898a6ebfe997e8
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f12bf3da75454e5aae4644f2a1d46fdf90f68e680dbf5bdaa86861f825d32d80
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a883389afac12125c2c6bf62631b7de0220fdb0020d24cd0c6e8f8858dd3b362
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2faef1b8798e7516fd96ee7b3363866a8f97ca2d0ec5a8dd27bbfe70b0c6a733
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:577d49de6d60035e159d9ebb1e6eabef79a55787b14ecea93a6a93c242661779
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f35f6d27fbd414dd4285d91816b37fb6b97ff10fbba4c074d56ad2a7f723033
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5f2dd1c21e06806a9ce39eeab45734dfb8a62b829f91a86d1f65f13102d6242
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea5c64dfc7e3b2729065483dfef8e4bb0af0d9bae32df888d258ee3c2859d676
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4affa863c39f4a87a7aa62bb6d8ea5d9ce72773cba2b4ccffc763273823a37b1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8d0442374b2f8618569ef196bfe7955aa6b552a4eb29da5972e99b6fb6a7877
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.24180778861045837,
3
- "best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2300",
4
- "epoch": 0.6794682422451994,
5
  "eval_steps": 50,
6
- "global_step": 2300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4101,11 +4101,100 @@
4101
  "eval_steps_per_second": 0.791,
4102
  "num_input_tokens_seen": 23883032,
4103
  "step": 2300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4104
  }
4105
  ],
4106
  "logging_steps": 5,
4107
  "max_steps": 6770,
4108
- "num_input_tokens_seen": 23883032,
4109
  "num_train_epochs": 2,
4110
  "save_steps": 50,
4111
  "stateful_callbacks": {
@@ -4120,7 +4209,7 @@
4120
  "attributes": {}
4121
  }
4122
  },
4123
- "total_flos": 1575723931533312.0,
4124
  "train_batch_size": 1,
4125
  "trial_name": null,
4126
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.1869634985923767,
3
+ "best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-2350",
4
+ "epoch": 0.6942392909896603,
5
  "eval_steps": 50,
6
+ "global_step": 2350,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4101
  "eval_steps_per_second": 0.791,
4102
  "num_input_tokens_seen": 23883032,
4103
  "step": 2300
4104
+ },
4105
+ {
4106
+ "epoch": 0.6809453471196455,
4107
+ "grad_norm": 15.468575933907964,
4108
+ "learning_rate": 7.865936626267243e-05,
4109
+ "loss": 0.2474,
4110
+ "num_input_tokens_seen": 23934880,
4111
+ "step": 2305
4112
+ },
4113
+ {
4114
+ "epoch": 0.6824224519940916,
4115
+ "grad_norm": 3.9259269918244932,
4116
+ "learning_rate": 7.855920710508009e-05,
4117
+ "loss": 0.2613,
4118
+ "num_input_tokens_seen": 23986160,
4119
+ "step": 2310
4120
+ },
4121
+ {
4122
+ "epoch": 0.6838995568685377,
4123
+ "grad_norm": 1.443222642921112,
4124
+ "learning_rate": 7.845887756354458e-05,
4125
+ "loss": 0.1957,
4126
+ "num_input_tokens_seen": 24038984,
4127
+ "step": 2315
4128
+ },
4129
+ {
4130
+ "epoch": 0.6853766617429837,
4131
+ "grad_norm": 2.418773014069429,
4132
+ "learning_rate": 7.835837823663092e-05,
4133
+ "loss": 0.2709,
4134
+ "num_input_tokens_seen": 24090648,
4135
+ "step": 2320
4136
+ },
4137
+ {
4138
+ "epoch": 0.6868537666174298,
4139
+ "grad_norm": 1.2678547091245644,
4140
+ "learning_rate": 7.825770972391712e-05,
4141
+ "loss": 0.2873,
4142
+ "num_input_tokens_seen": 24142200,
4143
+ "step": 2325
4144
+ },
4145
+ {
4146
+ "epoch": 0.6883308714918759,
4147
+ "grad_norm": 1.5899740505737827,
4148
+ "learning_rate": 7.81568726259905e-05,
4149
+ "loss": 0.2378,
4150
+ "num_input_tokens_seen": 24194400,
4151
+ "step": 2330
4152
+ },
4153
+ {
4154
+ "epoch": 0.689807976366322,
4155
+ "grad_norm": 1.6209911075093861,
4156
+ "learning_rate": 7.805586754444416e-05,
4157
+ "loss": 0.2615,
4158
+ "num_input_tokens_seen": 24245328,
4159
+ "step": 2335
4160
+ },
4161
+ {
4162
+ "epoch": 0.691285081240768,
4163
+ "grad_norm": 16.06254938606901,
4164
+ "learning_rate": 7.795469508187343e-05,
4165
+ "loss": 0.2234,
4166
+ "num_input_tokens_seen": 24297400,
4167
+ "step": 2340
4168
+ },
4169
+ {
4170
+ "epoch": 0.6927621861152142,
4171
+ "grad_norm": 2.2353075576651085,
4172
+ "learning_rate": 7.785335584187219e-05,
4173
+ "loss": 0.2833,
4174
+ "num_input_tokens_seen": 24348536,
4175
+ "step": 2345
4176
+ },
4177
+ {
4178
+ "epoch": 0.6942392909896603,
4179
+ "grad_norm": 11.321777956495533,
4180
+ "learning_rate": 7.775185042902933e-05,
4181
+ "loss": 0.2313,
4182
+ "num_input_tokens_seen": 24401256,
4183
+ "step": 2350
4184
+ },
4185
+ {
4186
+ "epoch": 0.6942392909896603,
4187
+ "eval_loss": 0.1869634985923767,
4188
+ "eval_runtime": 19.499,
4189
+ "eval_samples_per_second": 3.077,
4190
+ "eval_steps_per_second": 0.769,
4191
+ "num_input_tokens_seen": 24401256,
4192
+ "step": 2350
4193
  }
4194
  ],
4195
  "logging_steps": 5,
4196
  "max_steps": 6770,
4197
+ "num_input_tokens_seen": 24401256,
4198
  "num_train_epochs": 2,
4199
  "save_steps": 50,
4200
  "stateful_callbacks": {
 
4209
  "attributes": {}
4210
  }
4211
  },
4212
+ "total_flos": 1609869937344512.0,
4213
  "train_batch_size": 1,
4214
  "trial_name": null,
4215
  "trial_params": null