End of training
Browse files- all_results.json +7 -7
- eval_results.json +3 -3
- train_results.json +4 -4
- trainer_state.json +19 -19
all_results.json
CHANGED
@@ -2,11 +2,11 @@
|
|
2 |
"epoch": 5.0,
|
3 |
"eval_accuracy": 0.9849624060150376,
|
4 |
"eval_loss": 0.08750259131193161,
|
5 |
-
"eval_runtime":
|
6 |
-
"eval_samples_per_second":
|
7 |
-
"eval_steps_per_second":
|
8 |
-
"train_loss": 0.
|
9 |
-
"train_runtime":
|
10 |
-
"train_samples_per_second":
|
11 |
-
"train_steps_per_second":
|
12 |
}
|
|
|
2 |
"epoch": 5.0,
|
3 |
"eval_accuracy": 0.9849624060150376,
|
4 |
"eval_loss": 0.08750259131193161,
|
5 |
+
"eval_runtime": 0.7758,
|
6 |
+
"eval_samples_per_second": 171.437,
|
7 |
+
"eval_steps_per_second": 21.913,
|
8 |
+
"train_loss": 0.23564630480913015,
|
9 |
+
"train_runtime": 101.4306,
|
10 |
+
"train_samples_per_second": 50.971,
|
11 |
+
"train_steps_per_second": 6.408
|
12 |
}
|
eval_results.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"epoch": 5.0,
|
3 |
"eval_accuracy": 0.9849624060150376,
|
4 |
"eval_loss": 0.08750259131193161,
|
5 |
-
"eval_runtime":
|
6 |
-
"eval_samples_per_second":
|
7 |
-
"eval_steps_per_second":
|
8 |
}
|
|
|
2 |
"epoch": 5.0,
|
3 |
"eval_accuracy": 0.9849624060150376,
|
4 |
"eval_loss": 0.08750259131193161,
|
5 |
+
"eval_runtime": 0.7758,
|
6 |
+
"eval_samples_per_second": 171.437,
|
7 |
+
"eval_steps_per_second": 21.913
|
8 |
}
|
train_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
-
"train_loss": 0.
|
4 |
-
"train_runtime":
|
5 |
-
"train_samples_per_second":
|
6 |
-
"train_steps_per_second":
|
7 |
}
|
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
+
"train_loss": 0.23564630480913015,
|
4 |
+
"train_runtime": 101.4306,
|
5 |
+
"train_samples_per_second": 50.971,
|
6 |
+
"train_steps_per_second": 6.408
|
7 |
}
|
trainer_state.json
CHANGED
@@ -89,9 +89,9 @@
|
|
89 |
"epoch": 1.0,
|
90 |
"eval_accuracy": 0.9624060150375939,
|
91 |
"eval_loss": 0.23068006336688995,
|
92 |
-
"eval_runtime": 0.
|
93 |
-
"eval_samples_per_second":
|
94 |
-
"eval_steps_per_second":
|
95 |
"step": 130
|
96 |
},
|
97 |
{
|
@@ -176,9 +176,9 @@
|
|
176 |
"epoch": 2.0,
|
177 |
"eval_accuracy": 0.9924812030075187,
|
178 |
"eval_loss": 0.11085593700408936,
|
179 |
-
"eval_runtime": 0.
|
180 |
-
"eval_samples_per_second":
|
181 |
-
"eval_steps_per_second":
|
182 |
"step": 260
|
183 |
},
|
184 |
{
|
@@ -263,9 +263,9 @@
|
|
263 |
"epoch": 3.0,
|
264 |
"eval_accuracy": 0.9699248120300752,
|
265 |
"eval_loss": 0.1108752116560936,
|
266 |
-
"eval_runtime": 0.
|
267 |
-
"eval_samples_per_second":
|
268 |
-
"eval_steps_per_second":
|
269 |
"step": 390
|
270 |
},
|
271 |
{
|
@@ -350,9 +350,9 @@
|
|
350 |
"epoch": 4.0,
|
351 |
"eval_accuracy": 0.9849624060150376,
|
352 |
"eval_loss": 0.08750259131193161,
|
353 |
-
"eval_runtime": 0.
|
354 |
-
"eval_samples_per_second":
|
355 |
-
"eval_steps_per_second": 22.
|
356 |
"step": 520
|
357 |
},
|
358 |
{
|
@@ -437,19 +437,19 @@
|
|
437 |
"epoch": 5.0,
|
438 |
"eval_accuracy": 0.9774436090225563,
|
439 |
"eval_loss": 0.08863506466150284,
|
440 |
-
"eval_runtime": 0.
|
441 |
-
"eval_samples_per_second":
|
442 |
-
"eval_steps_per_second":
|
443 |
"step": 650
|
444 |
},
|
445 |
{
|
446 |
"epoch": 5.0,
|
447 |
"step": 650,
|
448 |
"total_flos": 4.006371770595533e+17,
|
449 |
-
"train_loss": 0.
|
450 |
-
"train_runtime":
|
451 |
-
"train_samples_per_second":
|
452 |
-
"train_steps_per_second":
|
453 |
}
|
454 |
],
|
455 |
"max_steps": 650,
|
|
|
89 |
"epoch": 1.0,
|
90 |
"eval_accuracy": 0.9624060150375939,
|
91 |
"eval_loss": 0.23068006336688995,
|
92 |
+
"eval_runtime": 0.7854,
|
93 |
+
"eval_samples_per_second": 169.35,
|
94 |
+
"eval_steps_per_second": 21.646,
|
95 |
"step": 130
|
96 |
},
|
97 |
{
|
|
|
176 |
"epoch": 2.0,
|
177 |
"eval_accuracy": 0.9924812030075187,
|
178 |
"eval_loss": 0.11085593700408936,
|
179 |
+
"eval_runtime": 0.7261,
|
180 |
+
"eval_samples_per_second": 183.181,
|
181 |
+
"eval_steps_per_second": 23.414,
|
182 |
"step": 260
|
183 |
},
|
184 |
{
|
|
|
263 |
"epoch": 3.0,
|
264 |
"eval_accuracy": 0.9699248120300752,
|
265 |
"eval_loss": 0.1108752116560936,
|
266 |
+
"eval_runtime": 0.7271,
|
267 |
+
"eval_samples_per_second": 182.92,
|
268 |
+
"eval_steps_per_second": 23.381,
|
269 |
"step": 390
|
270 |
},
|
271 |
{
|
|
|
350 |
"epoch": 4.0,
|
351 |
"eval_accuracy": 0.9849624060150376,
|
352 |
"eval_loss": 0.08750259131193161,
|
353 |
+
"eval_runtime": 0.7445,
|
354 |
+
"eval_samples_per_second": 178.634,
|
355 |
+
"eval_steps_per_second": 22.833,
|
356 |
"step": 520
|
357 |
},
|
358 |
{
|
|
|
437 |
"epoch": 5.0,
|
438 |
"eval_accuracy": 0.9774436090225563,
|
439 |
"eval_loss": 0.08863506466150284,
|
440 |
+
"eval_runtime": 0.7378,
|
441 |
+
"eval_samples_per_second": 180.271,
|
442 |
+
"eval_steps_per_second": 23.042,
|
443 |
"step": 650
|
444 |
},
|
445 |
{
|
446 |
"epoch": 5.0,
|
447 |
"step": 650,
|
448 |
"total_flos": 4.006371770595533e+17,
|
449 |
+
"train_loss": 0.23564630480913015,
|
450 |
+
"train_runtime": 101.4306,
|
451 |
+
"train_samples_per_second": 50.971,
|
452 |
+
"train_steps_per_second": 6.408
|
453 |
}
|
454 |
],
|
455 |
"max_steps": 650,
|