evgmaslov commited on
Commit
0318512
1 Parent(s): 3d2c017

Training in progress, step 1059, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98aba24d1fe4652cee536ec017bb74b497838690e6de4456baf5305851f862f4
3
  size 109069176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8dbcd3f2df87fa92f8c899ddd99a7a6c3361ecf1f3155dc729ee2e7204c9de
3
  size 109069176
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb2e7b42bc59f5b6aa4a5aeb586f71702394b8c3f62d1b520ed222f9d9706b08
3
  size 218182650
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16473a4a6a91f910c8d6460a31ebf3018f1d556a00c8894fd497fdbd0c3817ff
3
  size 218182650
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2a3f6ceea2a0c9b0a500f11618e34dcda55772c2b889eddbd0f6523933bb590
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f85bbc24f38c28541cca3607d5926e5d091869d2a0e283ee4c798dfc89622000
3
  size 15920
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb503c368b8cd38eae1790c9b004965206255a94fbbd64584d9f2a888f048180
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef342e05caa9e790072cd9bc3d096020932cd1c3586ba855ecc382154f1d26f4
3
  size 15920
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3bff28db7938c4764b9145df1087e8a16b9c33dc6a70a876bd79a3712f247aa
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c9b09861d0574d083d9f8add5c762030220b135e9b8d04d3cfd41e299fc56f6
3
  size 15920
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a358e13bb5878669fb5eaa6aa23b5d5c525855355d5750750c295b657def741f
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:305931b158387d9e2e94c3f46229f1645b2f12020d6e57d50a725177eaa7fd98
3
  size 15920
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62924847080e51ab7a41e260d3db9385c7511f5a640bd7e5022f28b05bb46cd3
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75cfa167b8702df7b304cf73deceb2595c3cc08b550b70ebfd5ae62b4f86fa3e
3
  size 15920
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bb3d3ec880046360e8f11ef9d55a0796c3936aac653379d8402f7a9a298d4c4
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ac0ed767bb7fb89b283d5925156d9763d0bc83ec4505e1ff9c992f88905fab8
3
  size 15920
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1628ad4546449d1fc7fbaca4c2024cba05024444c7b5092bfb77893a7bb7a785
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f2fe761ed37ead8dca0d14b4837488442a64c5938e29e58e46206f425d8dad5
3
  size 15920
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ddb44a8e2baeeb2ea10e0db0e6ed57a39236bcdc289b8fae7a1fa0b0999f2ded
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1f5261d86491fd42a1b2b06153e8ac080f9115914cb858320097db5d4dad5b9
3
  size 15920
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ee76b6323a7876a5231a2afe442ff8854dbbdd9d2119d7ce1bb953ecf9b2892
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:505775f8c54d1f6efb9298789c5e9f519d24f0015cdd570247c62a3cc1047c07
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9442870632672332,
5
  "eval_steps": 100,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -115,12 +115,12 @@
115
  "should_evaluate": false,
116
  "should_log": false,
117
  "should_save": true,
118
- "should_training_stop": false
119
  },
120
  "attributes": {}
121
  }
122
  },
123
- "total_flos": 1.006318585573802e+18,
124
  "train_batch_size": 4,
125
  "trial_name": null,
126
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0,
5
  "eval_steps": 100,
6
+ "global_step": 1059,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
115
  "should_evaluate": false,
116
  "should_log": false,
117
  "should_save": true,
118
+ "should_training_stop": true
119
  },
120
  "attributes": {}
121
  }
122
  },
123
+ "total_flos": 1.0657744835722609e+18,
124
  "train_batch_size": 4,
125
  "trial_name": null,
126
  "trial_params": null