polejowska commited on
Commit
9a96f10
·
1 Parent(s): 4df5b74

End of training

Browse files
runs/Mar01_15-17-11_Agatas-MacBook-Pro.local/events.out.tfevents.1677680237.Agatas-MacBook-Pro.local.35252.2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c67068337a66b39d8540e6d6bb0dd7eae024b0eff29c515cef5f7e071346d4a3
3
- size 5349
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b64e9e952743a801af12e09c88fc07511330ff69222a97792b6f541e8e57d6e1
3
+ size 5703
trainer_state.json CHANGED
@@ -9,40 +9,40 @@
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "learning_rate": 5e-05,
13
- "loss": 6.9121,
14
  "step": 94
15
  },
16
  {
17
  "epoch": 1.0,
18
- "eval_loss": 4.612173557281494,
19
- "eval_runtime": 71.058,
20
- "eval_samples_per_second": 2.815,
21
- "eval_steps_per_second": 0.352,
22
  "step": 94
23
  },
24
  {
25
  "epoch": 2.0,
26
  "learning_rate": 0.0,
27
- "loss": 5.9062,
28
  "step": 188
29
  },
30
  {
31
  "epoch": 2.0,
32
- "eval_loss": 4.612091541290283,
33
- "eval_runtime": 71.351,
34
- "eval_samples_per_second": 2.803,
35
- "eval_steps_per_second": 0.35,
36
  "step": 188
37
  },
38
  {
39
  "epoch": 2.0,
40
  "step": 188,
41
  "total_flos": 6.168280896e+17,
42
- "train_loss": 6.409146572681183,
43
- "train_runtime": 1163.2401,
44
- "train_samples_per_second": 1.29,
45
- "train_steps_per_second": 0.162
46
  }
47
  ],
48
  "max_steps": 188,
 
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "learning_rate": 0.0005,
13
+ "loss": 5.9448,
14
  "step": 94
15
  },
16
  {
17
  "epoch": 1.0,
18
+ "eval_loss": 4.646627902984619,
19
+ "eval_runtime": 70.2506,
20
+ "eval_samples_per_second": 2.847,
21
+ "eval_steps_per_second": 0.356,
22
  "step": 94
23
  },
24
  {
25
  "epoch": 2.0,
26
  "learning_rate": 0.0,
27
+ "loss": 4.6291,
28
  "step": 188
29
  },
30
  {
31
  "epoch": 2.0,
32
+ "eval_loss": 4.621755123138428,
33
+ "eval_runtime": 70.6527,
34
+ "eval_samples_per_second": 2.831,
35
+ "eval_steps_per_second": 0.354,
36
  "step": 188
37
  },
38
  {
39
  "epoch": 2.0,
40
  "step": 188,
41
  "total_flos": 6.168280896e+17,
42
+ "train_loss": 5.2869415283203125,
43
+ "train_runtime": 1145.3249,
44
+ "train_samples_per_second": 1.31,
45
+ "train_steps_per_second": 0.164
46
  }
47
  ],
48
  "max_steps": 188,