jssky commited on
Commit
50e8b36
1 Parent(s): e059201

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ba4843bab3f6c0de98cf2828f8059fac627894d15376bf6eb4b6b539d909db8
3
  size 73911112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fff02c7b4a826fb07ea195bb1a7bb4ffc9d721a69210b761baa58148f930fa7
3
  size 73911112
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4d523ab2ba4df3c774b98bf6109a8713c9f0199b76bff1f7449efce144029eb
3
  size 37965300
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:319548d2ea9e5b5f008e022dad56cd0f028de3735befddd24f255983fefd537e
3
  size 37965300
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1881ec4d999362af1e52c36de1e218d3800542004d7f7c7edd42a089b7296ccc
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dbb2e8ac6910520ef7694e04efc0c3d22d47c0a6764ae2a666b6a667647ed1d
3
  size 15984
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00d02bbc0fa1d27820c289ea283e0155cafcbd62fa1759df4850d0a715649da0
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a64ea9853e527aeaa3e3e8ab63280f7a104d71f06cbc00b6586cb1151066797
3
  size 15984
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c73827ec09ff37ba195a38bf7f08f0537cea0c0a55db5d2fc0d29f759ccdcccb
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb597193ff9d2e676d231c4c21c97756a564739529ec012a7405fe102e2d6bf0
3
  size 15984
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4822c4ae863c6a81149f37fecf8fc589c5a0e68b5f03747420a5cc6ab7af0d14
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8844277a61aa266c1286de806f9fbc3a0e4ffe07a5d322e90f868a6bef7c6200
3
  size 15984
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e9b440498b750929a8558219fefc2e4ad160122931aa3d6799fc4f65cdd7304
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:516bda9bd375b4dbffe21ea5098d3ba187c60e9ac82d932b20a8bdf7f85f5e7f
3
  size 15984
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f0c18fbbe129f61ea282f7dbcc97540666d69c89e3f1cc4842d356efb45d0d6
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6da94ae89efb6930839681ba2aa052a5e83a69a0af729ccfc303f5699e7189e8
3
  size 15984
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a99554429161338da1a7001f3a511ce540238038412b9c31276e6f7379ad186a
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8788fd8bf5c71109ab3d1b1b8fb5df84005194baadaf8d32a3898477ae2e1c3e
3
  size 15984
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e39d4edd2882a248daa72fe9c907359ed8ef2a193dbcaec84663291acb998ec0
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b5cb477ad7cfcb7f3e9b4e0628a58437296983ffbd992ed46c97df77959dad1
3
  size 15984
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c8e6b04902f17ae368c3e6cfd97a31ad4de2f025d673daea8c033ce0e260946
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb578e75c11a81e85dda67a691f96ba4793a02960f1409fd3e1511aac873491a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.0131916452913155,
5
  "eval_steps": 3,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -102,6 +102,13 @@
102
  "eval_samples_per_second": 76.673,
103
  "eval_steps_per_second": 9.601,
104
  "step": 9
 
 
 
 
 
 
 
105
  }
106
  ],
107
  "logging_steps": 1,
@@ -116,12 +123,12 @@
116
  "should_evaluate": false,
117
  "should_log": false,
118
  "should_save": true,
119
- "should_training_stop": false
120
  },
121
  "attributes": {}
122
  }
123
  },
124
- "total_flos": 9405135625125888.0,
125
  "train_batch_size": 1,
126
  "trial_name": null,
127
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.014657383657017223,
5
  "eval_steps": 3,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
102
  "eval_samples_per_second": 76.673,
103
  "eval_steps_per_second": 9.601,
104
  "step": 9
105
+ },
106
+ {
107
+ "epoch": 0.014657383657017223,
108
+ "grad_norm": 0.09443683177232742,
109
+ "learning_rate": 0.0002,
110
+ "loss": 0.7131,
111
+ "step": 10
112
  }
113
  ],
114
  "logging_steps": 1,
 
123
  "should_evaluate": false,
124
  "should_log": false,
125
  "should_save": true,
126
+ "should_training_stop": true
127
  },
128
  "attributes": {}
129
  }
130
  },
131
+ "total_flos": 1.045015069458432e+16,
132
  "train_batch_size": 1,
133
  "trial_name": null,
134
  "trial_params": null