Training in progress, step 1201, checkpoint

Files changed (14) hide show

last-checkpoint/adapter_config.json CHANGED Viewed

@@ -19,7 +19,7 @@
   "r": 8,
   "rank_pattern": {},
   "revision": null,
-  "target_modules": "^(?!.*patch_embed).*(?:fc1|fc2|down_proj|proj|qkv|o_proj|q_proj|gate_proj|v_proj|k_proj|up_proj).*",
   "task_type": "CAUSAL_LM",
   "use_dora": false,
   "use_rslora": false

   "r": 8,
   "rank_pattern": {},
   "revision": null,
+  "target_modules": "^(?!.*patch_embed).*(?:gate_proj|qkv|q_proj|fc1|fc2|up_proj|v_proj|down_proj|k_proj|proj|o_proj).*",
   "task_type": "CAUSAL_LM",
   "use_dora": false,
   "use_rslora": false

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:419197c7b895b88c7afacbe056bbf0e1d22ab3d4ba5caafffba674acfa991533
 size 29034840

 version https://git-lfs.github.com/spec/v1
+oid sha256:c8ee2634589442880539cea4215aeae5e195f22dea93b6441497472981b36691
 size 29034840

last-checkpoint/global_step1201/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:7f2e82372caf676c0b0a5d6293d69692257dd9d7feba954d3cf78ff2a70ae83a
+size 43429616

last-checkpoint/global_step1201/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3dcab03ce19f2ce79a8d53b6ae3f4ac03ac0016d02e59b794c7273852dc5ea6b
+size 43429616

last-checkpoint/global_step1201/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:041435127598402c8acd20dc5a7396b5a683309f402f68fd38fcfe3757dca0d3
+size 43429616

last-checkpoint/global_step1201/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e27d0cc4e7dc7fd4de69c4b1bdcc21d5c4137e83ab060e88c385c55ec12dd8d7
+size 43429616

last-checkpoint/global_step1201/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:2075f75ba9a6a574ce7120222ba9095b5c8eb216d857b0767671c01fbc074e7e
+size 637299

last-checkpoint/global_step1201/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6935f4971e1fcb55db5d1f64ef46b459823eff82ade7deff0a5a993f4583bfa7
+size 637171

last-checkpoint/global_step1201/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f9f8f66781db0d1a0637d1dd44b041752fe0978d10f864754f9f8493ed63704
+size 637171

last-checkpoint/global_step1201/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:872a5c568bb2f8cccc429cc5283d43928998853b7318c61f3218fc4c7ef8335f
+size 637171

last-checkpoint/latest CHANGED Viewed

	@@ -1 +1 @@
1	- ~~global_step1200~~


1	+ global_step1201

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:16e0cffc6b063574ed312ee2198c86d3dddf2450d0400f042fdc08bd22dcbc7f
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:3cb88c2bb06d05128047dc279e5c6aaaceeada9fc352a92b1e5300def3533252
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": 1.5566551155643538e-05,
   "best_model_checkpoint": "saves/CADICA_qwenvl_direction_scale4/lora/sft/checkpoint-1150",
-  "epoch": 0.6180788050476436,
   "eval_steps": 50,
-  "global_step": 1200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2146,9 +2146,9 @@
     }
   ],
   "logging_steps": 5,
-  "max_steps": 3400,
-  "num_input_tokens_seen": 11980800,
-  "num_train_epochs": 2,
   "save_steps": 50,
   "stateful_callbacks": {
     "TrainerControl": {
@@ -2157,12 +2157,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 790504338096128.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": 1.5566551155643538e-05,
   "best_model_checkpoint": "saves/CADICA_qwenvl_direction_scale4/lora/sft/checkpoint-1150",
+  "epoch": 0.6185938707185166,
   "eval_steps": 50,
+  "global_step": 1201,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
     }
   ],
   "logging_steps": 5,
+  "max_steps": 1200,
+  "num_input_tokens_seen": 11990784,
+  "num_train_epochs": 1,
   "save_steps": 50,
   "stateful_callbacks": {
     "TrainerControl": {
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 791107965943808.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3dd22ff474a0bb22d03021b1610996d5087b23b263bba9bcd763538291569b0e
-size 7352

 version https://git-lfs.github.com/spec/v1
+oid sha256:d805df10b9aa9257d71d396f9c297d6e4b0be2e8da8eecef0b7efe313a60a238
+size 7416