leejw51 committed on
Commit
b472ff6
·
1 Parent(s): d0ebe4a

End of training

Browse files
all_results.json CHANGED
@@ -2,11 +2,11 @@
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9849624060150376,
4
  "eval_loss": 0.08750259131193161,
5
- "eval_runtime": 0.7701,
6
- "eval_samples_per_second": 172.714,
7
- "eval_steps_per_second": 22.076,
8
  "train_loss": 0.23564630480913015,
9
- "train_runtime": 86.389,
10
- "train_samples_per_second": 59.846,
11
- "train_steps_per_second": 7.524
12
  }
 
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9849624060150376,
4
  "eval_loss": 0.08750259131193161,
5
+ "eval_runtime": 0.8068,
6
+ "eval_samples_per_second": 164.846,
7
+ "eval_steps_per_second": 21.071,
8
  "train_loss": 0.23564630480913015,
9
+ "train_runtime": 92.709,
10
+ "train_samples_per_second": 55.766,
11
+ "train_steps_per_second": 7.011
12
  }
eval_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9849624060150376,
4
  "eval_loss": 0.08750259131193161,
5
- "eval_runtime": 0.7701,
6
- "eval_samples_per_second": 172.714,
7
- "eval_steps_per_second": 22.076
8
  }
 
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9849624060150376,
4
  "eval_loss": 0.08750259131193161,
5
+ "eval_runtime": 0.8068,
6
+ "eval_samples_per_second": 164.846,
7
+ "eval_steps_per_second": 21.071
8
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 5.0,
3
  "train_loss": 0.23564630480913015,
4
- "train_runtime": 86.389,
5
- "train_samples_per_second": 59.846,
6
- "train_steps_per_second": 7.524
7
  }
 
1
  {
2
  "epoch": 5.0,
3
  "train_loss": 0.23564630480913015,
4
+ "train_runtime": 92.709,
5
+ "train_samples_per_second": 55.766,
6
+ "train_steps_per_second": 7.011
7
  }
trainer_state.json CHANGED
@@ -89,9 +89,9 @@
89
  "epoch": 1.0,
90
  "eval_accuracy": 0.9624060150375939,
91
  "eval_loss": 0.23068006336688995,
92
- "eval_runtime": 0.7405,
93
- "eval_samples_per_second": 179.618,
94
- "eval_steps_per_second": 22.959,
95
  "step": 130
96
  },
97
  {
@@ -176,9 +176,9 @@
176
  "epoch": 2.0,
177
  "eval_accuracy": 0.9924812030075187,
178
  "eval_loss": 0.11085593700408936,
179
- "eval_runtime": 0.7599,
180
- "eval_samples_per_second": 175.032,
181
- "eval_steps_per_second": 22.373,
182
  "step": 260
183
  },
184
  {
@@ -263,9 +263,9 @@
263
  "epoch": 3.0,
264
  "eval_accuracy": 0.9699248120300752,
265
  "eval_loss": 0.1108752116560936,
266
- "eval_runtime": 0.7499,
267
- "eval_samples_per_second": 177.363,
268
- "eval_steps_per_second": 22.67,
269
  "step": 390
270
  },
271
  {
@@ -350,9 +350,9 @@
350
  "epoch": 4.0,
351
  "eval_accuracy": 0.9849624060150376,
352
  "eval_loss": 0.08750259131193161,
353
- "eval_runtime": 0.7317,
354
- "eval_samples_per_second": 181.777,
355
- "eval_steps_per_second": 23.235,
356
  "step": 520
357
  },
358
  {
@@ -437,9 +437,9 @@
437
  "epoch": 5.0,
438
  "eval_accuracy": 0.9774436090225563,
439
  "eval_loss": 0.08863506466150284,
440
- "eval_runtime": 0.7357,
441
- "eval_samples_per_second": 180.787,
442
- "eval_steps_per_second": 23.108,
443
  "step": 650
444
  },
445
  {
@@ -447,9 +447,9 @@
447
  "step": 650,
448
  "total_flos": 4.006371770595533e+17,
449
  "train_loss": 0.23564630480913015,
450
- "train_runtime": 86.389,
451
- "train_samples_per_second": 59.846,
452
- "train_steps_per_second": 7.524
453
  }
454
  ],
455
  "max_steps": 650,
 
89
  "epoch": 1.0,
90
  "eval_accuracy": 0.9624060150375939,
91
  "eval_loss": 0.23068006336688995,
92
+ "eval_runtime": 0.7684,
93
+ "eval_samples_per_second": 173.093,
94
+ "eval_steps_per_second": 22.125,
95
  "step": 130
96
  },
97
  {
 
176
  "epoch": 2.0,
177
  "eval_accuracy": 0.9924812030075187,
178
  "eval_loss": 0.11085593700408936,
179
+ "eval_runtime": 0.7745,
180
+ "eval_samples_per_second": 171.733,
181
+ "eval_steps_per_second": 21.951,
182
  "step": 260
183
  },
184
  {
 
263
  "epoch": 3.0,
264
  "eval_accuracy": 0.9699248120300752,
265
  "eval_loss": 0.1108752116560936,
266
+ "eval_runtime": 0.7607,
267
+ "eval_samples_per_second": 174.831,
268
+ "eval_steps_per_second": 22.347,
269
  "step": 390
270
  },
271
  {
 
350
  "epoch": 4.0,
351
  "eval_accuracy": 0.9849624060150376,
352
  "eval_loss": 0.08750259131193161,
353
+ "eval_runtime": 0.7575,
354
+ "eval_samples_per_second": 175.569,
355
+ "eval_steps_per_second": 22.441,
356
  "step": 520
357
  },
358
  {
 
437
  "epoch": 5.0,
438
  "eval_accuracy": 0.9774436090225563,
439
  "eval_loss": 0.08863506466150284,
440
+ "eval_runtime": 0.7631,
441
+ "eval_samples_per_second": 174.294,
442
+ "eval_steps_per_second": 22.278,
443
  "step": 650
444
  },
445
  {
 
447
  "step": 650,
448
  "total_flos": 4.006371770595533e+17,
449
  "train_loss": 0.23564630480913015,
450
+ "train_runtime": 92.709,
451
+ "train_samples_per_second": 55.766,
452
+ "train_steps_per_second": 7.011
453
  }
454
  ],
455
  "max_steps": 650,