alejndrojavier commited on
Commit
2e21e00
1 Parent(s): f6a6baa

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6352a74e314452393f2a2fcf071c68c935c571007dfbcc47e746cf616a7246a1
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41992a55aa9943c8302d141033b567a11ee530849b4fe2c77b7578e46eaf5a62
3
  size 267832560
tmp-checkpoint-175/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6352a74e314452393f2a2fcf071c68c935c571007dfbcc47e746cf616a7246a1
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41992a55aa9943c8302d141033b567a11ee530849b4fe2c77b7578e46eaf5a62
3
  size 267832560
tmp-checkpoint-175/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:467810065677088ea64b1a84b5d3872a1458ff620639aee59220366634b1d3ea
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f098f42091324014d70498dda49fcd2e57bbc8352875cb37f6b33abafebebd92
3
  size 535727290
tmp-checkpoint-175/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c58ef9a709639d15ce823cbab1c94a327f84302849ffa232663b1d79c1fa4e24
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2799fb355a6059a45cee9f0cd6d7dec02193106ed08b481f241a6fee90738b0d
3
  size 14244
tmp-checkpoint-175/trainer_state.json CHANGED
@@ -11,29 +11,29 @@
11
  {
12
  "epoch": 0.29,
13
  "learning_rate": 1.0000000000000002e-06,
14
- "loss": 0.5522,
15
  "step": 50
16
  },
17
  {
18
  "epoch": 0.57,
19
  "learning_rate": 2.0000000000000003e-06,
20
- "loss": 0.553,
21
  "step": 100
22
  },
23
  {
24
  "epoch": 0.86,
25
  "learning_rate": 3e-06,
26
- "loss": 0.5327,
27
  "step": 150
28
  },
29
  {
30
  "epoch": 1.0,
31
  "eval_accuracy": 0.7685714285714286,
32
  "eval_f1": 0.8691437802907915,
33
- "eval_loss": 0.5155649185180664,
34
- "eval_runtime": 10.9449,
35
- "eval_samples_per_second": 63.957,
36
- "eval_steps_per_second": 4.02,
37
  "step": 175
38
  }
39
  ],
 
11
  {
12
  "epoch": 0.29,
13
  "learning_rate": 1.0000000000000002e-06,
14
+ "loss": 0.5582,
15
  "step": 50
16
  },
17
  {
18
  "epoch": 0.57,
19
  "learning_rate": 2.0000000000000003e-06,
20
+ "loss": 0.5351,
21
  "step": 100
22
  },
23
  {
24
  "epoch": 0.86,
25
  "learning_rate": 3e-06,
26
+ "loss": 0.541,
27
  "step": 150
28
  },
29
  {
30
  "epoch": 1.0,
31
  "eval_accuracy": 0.7685714285714286,
32
  "eval_f1": 0.8691437802907915,
33
+ "eval_loss": 0.5197482705116272,
34
+ "eval_runtime": 11.1124,
35
+ "eval_samples_per_second": 62.992,
36
+ "eval_steps_per_second": 3.96,
37
  "step": 175
38
  }
39
  ],