ben81828 commited on
Commit
91704ee
·
verified ·
1 Parent(s): c11cc4d

Training in progress, step 1950, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbfd21913024836a541ea9e4804a4fbd723ce6bc0181f6257333676058a340fa
3
  size 29034840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24258a1c284f2e5e09aacf01faee241dabd7ef5ca96fece0a7b0849d7edeb577
3
  size 29034840
last-checkpoint/global_step1950/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82aaadf47a144b788872e51c6a1a6007fefeb003f4d352eec1a00254d36c6ab0
3
+ size 43429616
last-checkpoint/global_step1950/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ee1eaee89ef24958e4b33fdc1d3cec1bfe7cce8494a7d935d11b9bc5cba7900
3
+ size 43429616
last-checkpoint/global_step1950/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a797afc790c7358ad676cbc51801b99f9ba67cb6d009bd651f4001d6e45420c0
3
+ size 43429616
last-checkpoint/global_step1950/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5ae1f1f5991994465ba8432397478cdc71281b6497781452a906eb68d626072
3
+ size 43429616
last-checkpoint/global_step1950/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec2eee1c827b58b94cbb0ba0dc8b44f046c8cbab8f4d8f244be51bf3c1e0a3db
3
+ size 637299
last-checkpoint/global_step1950/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc9e2862ddf9da9018e498cb0ddaff309c1fe0955553cb6c40835a940701d96e
3
+ size 637171
last-checkpoint/global_step1950/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a8aeb2a9ee16658bc362ef45e432893c9c07e02ea21b64f97648ac7042f7216
3
+ size 637171
last-checkpoint/global_step1950/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:075ee02aba76263bff18e95eb0d231f36fef41bdacc3184f2e24255758e4ea16
3
+ size 637171
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1900
 
1
+ global_step1950
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:585b8316bac42fce8431ad71be5542adc79fdd5ff1839401f8374f6ab8226086
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a12f59c32c769438d50dc0cafe27e6fc40938bdddec36889a5df342054ce351e
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc4c7cc343f6d985da07523b86ffd7b02d0b8ae40ff925936c48aff8a7385f39
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adfe49ca065b2692ef1b5fa1d31070f7f1bd192ca458adb37564630382a34304
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b364386e5b3618cb74f99527a8e31fa3c7d8d93018d2d0cf0b819ae4c3c1794b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2128704174ab99852922ed60f853889db68df441b0349c973ed4e07336cfce8e
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed71fe0f2fd47c414d9fd305b847e65b2f95946543d7b867318fdc05f761e6bc
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:090480cd9b6a50ca427e61698c04a96bcef20285d14b3963931e7e5bf69fddf8
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1638a0d8fae0cac9f51058dc27d95044277961dbc065df33adbdd1c6ae671a0d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a323a8ccf8ef79a414d4a8cf4f36b33f1f113b5c5ffb8de9538d61f0bfd4dcd6
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.28714123368263245,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-1550",
4
- "epoch": 0.5612998522895125,
5
  "eval_steps": 50,
6
- "global_step": 1900,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -3389,11 +3389,100 @@
3389
  "eval_steps_per_second": 0.773,
3390
  "num_input_tokens_seen": 19735976,
3391
  "step": 1900
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3392
  }
3393
  ],
3394
  "logging_steps": 5,
3395
  "max_steps": 6770,
3396
- "num_input_tokens_seen": 19735976,
3397
  "num_train_epochs": 2,
3398
  "save_steps": 50,
3399
  "stateful_callbacks": {
@@ -3408,7 +3497,7 @@
3408
  "attributes": {}
3409
  }
3410
  },
3411
- "total_flos": 1302030401404928.0,
3412
  "train_batch_size": 1,
3413
  "trial_name": null,
3414
  "trial_params": null
 
1
  {
2
  "best_metric": 0.28714123368263245,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_direction_then_DetectAndClassify_scale6/lora/sft/checkpoint-1550",
4
+ "epoch": 0.5760709010339734,
5
  "eval_steps": 50,
6
+ "global_step": 1950,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
3389
  "eval_steps_per_second": 0.773,
3390
  "num_input_tokens_seen": 19735976,
3391
  "step": 1900
3392
+ },
3393
+ {
3394
+ "epoch": 0.5627769571639586,
3395
+ "grad_norm": 7.406464018339625,
3396
+ "learning_rate": 8.606901505441718e-05,
3397
+ "loss": 0.3128,
3398
+ "num_input_tokens_seen": 19787504,
3399
+ "step": 1905
3400
+ },
3401
+ {
3402
+ "epoch": 0.5642540620384048,
3403
+ "grad_norm": 2.9136695732910467,
3404
+ "learning_rate": 8.598432987897565e-05,
3405
+ "loss": 0.2711,
3406
+ "num_input_tokens_seen": 19839104,
3407
+ "step": 1910
3408
+ },
3409
+ {
3410
+ "epoch": 0.5657311669128509,
3411
+ "grad_norm": 16.37365104368587,
3412
+ "learning_rate": 8.589943002138295e-05,
3413
+ "loss": 0.3735,
3414
+ "num_input_tokens_seen": 19891064,
3415
+ "step": 1915
3416
+ },
3417
+ {
3418
+ "epoch": 0.5672082717872969,
3419
+ "grad_norm": 12.090734435687315,
3420
+ "learning_rate": 8.581431598815077e-05,
3421
+ "loss": 0.29,
3422
+ "num_input_tokens_seen": 19942368,
3423
+ "step": 1920
3424
+ },
3425
+ {
3426
+ "epoch": 0.568685376661743,
3427
+ "grad_norm": 2.098717687702263,
3428
+ "learning_rate": 8.572898828706857e-05,
3429
+ "loss": 0.2977,
3430
+ "num_input_tokens_seen": 19994816,
3431
+ "step": 1925
3432
+ },
3433
+ {
3434
+ "epoch": 0.5701624815361891,
3435
+ "grad_norm": 8.108786754862253,
3436
+ "learning_rate": 8.564344742720059e-05,
3437
+ "loss": 0.2483,
3438
+ "num_input_tokens_seen": 20046192,
3439
+ "step": 1930
3440
+ },
3441
+ {
3442
+ "epoch": 0.5716395864106352,
3443
+ "grad_norm": 32.34891985769585,
3444
+ "learning_rate": 8.55576939188827e-05,
3445
+ "loss": 0.3126,
3446
+ "num_input_tokens_seen": 20097328,
3447
+ "step": 1935
3448
+ },
3449
+ {
3450
+ "epoch": 0.5731166912850812,
3451
+ "grad_norm": 10.903589696110263,
3452
+ "learning_rate": 8.54717282737195e-05,
3453
+ "loss": 0.2688,
3454
+ "num_input_tokens_seen": 20149392,
3455
+ "step": 1940
3456
+ },
3457
+ {
3458
+ "epoch": 0.5745937961595273,
3459
+ "grad_norm": 1.6351631003571967,
3460
+ "learning_rate": 8.538555100458114e-05,
3461
+ "loss": 0.2491,
3462
+ "num_input_tokens_seen": 20201392,
3463
+ "step": 1945
3464
+ },
3465
+ {
3466
+ "epoch": 0.5760709010339734,
3467
+ "grad_norm": 13.847094678250938,
3468
+ "learning_rate": 8.529916262560038e-05,
3469
+ "loss": 0.2992,
3470
+ "num_input_tokens_seen": 20253288,
3471
+ "step": 1950
3472
+ },
3473
+ {
3474
+ "epoch": 0.5760709010339734,
3475
+ "eval_loss": 0.3468088209629059,
3476
+ "eval_runtime": 19.3874,
3477
+ "eval_samples_per_second": 3.095,
3478
+ "eval_steps_per_second": 0.774,
3479
+ "num_input_tokens_seen": 20253288,
3480
+ "step": 1950
3481
  }
3482
  ],
3483
  "logging_steps": 5,
3484
  "max_steps": 6770,
3485
+ "num_input_tokens_seen": 20253288,
3486
  "num_train_epochs": 2,
3487
  "save_steps": 50,
3488
  "stateful_callbacks": {
 
3497
  "attributes": {}
3498
  }
3499
  },
3500
+ "total_flos": 1336194242183168.0,
3501
  "train_batch_size": 1,
3502
  "trial_name": null,
3503
  "trial_params": null