TachyHealthResearch commited on
Commit
ce271be
1 Parent(s): bd79f13

Training in progress, step 150, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f167e9c776981f1c22ea8e02bd3d6330f283765cdc95160c57bf1aa04b11fc3
3
  size 65309632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c03ace3b99cc514c0e944aee1e66c1502ae598126c038b1132c77ee479b4ecf1
3
  size 65309632
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1a24463f21742aa34fbe27e76072eddf69fe74138488e58902342a74fbf36c7
3
  size 32995412
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76ed15de62911a974471aa555c5ebe2229e3ac95a886708c4532492725d1106a
3
  size 32995412
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f0cb6895b198d17891374cd93d94b45d251baef41691c82d99fe270719eae2d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6c7228b5760789e32d617ca96daf0a009e462f257ac0e66d0b616a8df253a53
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9702192071987640411db8cd497f9de57450f22a9586d9cce5affbc116fe7983
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194456d3c9e165255d5406a0f3f62973b0bede79d91784f72431350783e27ae7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.056,
5
  "eval_steps": 1000,
6
- "global_step": 140,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -847,13 +847,73 @@
847
  "learning_rate": 1.3793103448275863e-05,
848
  "loss": 2.1258,
849
  "step": 140
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
850
  }
851
  ],
852
  "logging_steps": 1,
853
  "max_steps": 150,
854
  "num_train_epochs": 1,
855
  "save_steps": 10,
856
- "total_flos": 7472731954317312.0,
857
  "trial_name": null,
858
  "trial_params": null
859
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.06,
5
  "eval_steps": 1000,
6
+ "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
847
  "learning_rate": 1.3793103448275863e-05,
848
  "loss": 2.1258,
849
  "step": 140
850
+ },
851
+ {
852
+ "epoch": 0.06,
853
+ "learning_rate": 1.2413793103448277e-05,
854
+ "loss": 1.9039,
855
+ "step": 141
856
+ },
857
+ {
858
+ "epoch": 0.06,
859
+ "learning_rate": 1.103448275862069e-05,
860
+ "loss": 1.8506,
861
+ "step": 142
862
+ },
863
+ {
864
+ "epoch": 0.06,
865
+ "learning_rate": 9.655172413793103e-06,
866
+ "loss": 1.7843,
867
+ "step": 143
868
+ },
869
+ {
870
+ "epoch": 0.06,
871
+ "learning_rate": 8.275862068965518e-06,
872
+ "loss": 1.9734,
873
+ "step": 144
874
+ },
875
+ {
876
+ "epoch": 0.06,
877
+ "learning_rate": 6.896551724137932e-06,
878
+ "loss": 2.0637,
879
+ "step": 145
880
+ },
881
+ {
882
+ "epoch": 0.06,
883
+ "learning_rate": 5.517241379310345e-06,
884
+ "loss": 1.9301,
885
+ "step": 146
886
+ },
887
+ {
888
+ "epoch": 0.06,
889
+ "learning_rate": 4.137931034482759e-06,
890
+ "loss": 1.9931,
891
+ "step": 147
892
+ },
893
+ {
894
+ "epoch": 0.06,
895
+ "learning_rate": 2.7586206896551725e-06,
896
+ "loss": 1.9537,
897
+ "step": 148
898
+ },
899
+ {
900
+ "epoch": 0.06,
901
+ "learning_rate": 1.3793103448275862e-06,
902
+ "loss": 2.0301,
903
+ "step": 149
904
+ },
905
+ {
906
+ "epoch": 0.06,
907
+ "learning_rate": 0.0,
908
+ "loss": 1.7689,
909
+ "step": 150
910
  }
911
  ],
912
  "logging_steps": 1,
913
  "max_steps": 150,
914
  "num_train_epochs": 1,
915
  "save_steps": 10,
916
+ "total_flos": 8076780710022144.0,
917
  "trial_name": null,
918
  "trial_params": null
919
  }