polejowska
committed on
Commit
·
9a96f10
1
Parent(s):
4df5b74
End of training
Browse files
runs/Mar01_15-17-11_Agatas-MacBook-Pro.local/events.out.tfevents.1677680237.Agatas-MacBook-Pro.local.35252.2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b64e9e952743a801af12e09c88fc07511330ff69222a97792b6f541e8e57d6e1
|
3 |
+
size 5703
|
trainer_state.json
CHANGED
@@ -9,40 +9,40 @@
|
|
9 |
"log_history": [
|
10 |
{
|
11 |
"epoch": 1.0,
|
12 |
-
"learning_rate":
|
13 |
-
"loss":
|
14 |
"step": 94
|
15 |
},
|
16 |
{
|
17 |
"epoch": 1.0,
|
18 |
-
"eval_loss": 4.
|
19 |
-
"eval_runtime":
|
20 |
-
"eval_samples_per_second": 2.
|
21 |
-
"eval_steps_per_second": 0.
|
22 |
"step": 94
|
23 |
},
|
24 |
{
|
25 |
"epoch": 2.0,
|
26 |
"learning_rate": 0.0,
|
27 |
-
"loss":
|
28 |
"step": 188
|
29 |
},
|
30 |
{
|
31 |
"epoch": 2.0,
|
32 |
-
"eval_loss": 4.
|
33 |
-
"eval_runtime":
|
34 |
-
"eval_samples_per_second": 2.
|
35 |
-
"eval_steps_per_second": 0.
|
36 |
"step": 188
|
37 |
},
|
38 |
{
|
39 |
"epoch": 2.0,
|
40 |
"step": 188,
|
41 |
"total_flos": 6.168280896e+17,
|
42 |
-
"train_loss":
|
43 |
-
"train_runtime":
|
44 |
-
"train_samples_per_second": 1.
|
45 |
-
"train_steps_per_second": 0.
|
46 |
}
|
47 |
],
|
48 |
"max_steps": 188,
|
|
|
9 |
"log_history": [
|
10 |
{
|
11 |
"epoch": 1.0,
|
12 |
+
"learning_rate": 0.0005,
|
13 |
+
"loss": 5.9448,
|
14 |
"step": 94
|
15 |
},
|
16 |
{
|
17 |
"epoch": 1.0,
|
18 |
+
"eval_loss": 4.646627902984619,
|
19 |
+
"eval_runtime": 70.2506,
|
20 |
+
"eval_samples_per_second": 2.847,
|
21 |
+
"eval_steps_per_second": 0.356,
|
22 |
"step": 94
|
23 |
},
|
24 |
{
|
25 |
"epoch": 2.0,
|
26 |
"learning_rate": 0.0,
|
27 |
+
"loss": 4.6291,
|
28 |
"step": 188
|
29 |
},
|
30 |
{
|
31 |
"epoch": 2.0,
|
32 |
+
"eval_loss": 4.621755123138428,
|
33 |
+
"eval_runtime": 70.6527,
|
34 |
+
"eval_samples_per_second": 2.831,
|
35 |
+
"eval_steps_per_second": 0.354,
|
36 |
"step": 188
|
37 |
},
|
38 |
{
|
39 |
"epoch": 2.0,
|
40 |
"step": 188,
|
41 |
"total_flos": 6.168280896e+17,
|
42 |
+
"train_loss": 5.2869415283203125,
|
43 |
+
"train_runtime": 1145.3249,
|
44 |
+
"train_samples_per_second": 1.31,
|
45 |
+
"train_steps_per_second": 0.164
|
46 |
}
|
47 |
],
|
48 |
"max_steps": 188,
|