leejw51 commited on
Commit
dadf7de
1 Parent(s): b56a17b

End of training

Browse files
all_results.json CHANGED
@@ -2,11 +2,11 @@
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9849624060150376,
4
  "eval_loss": 0.08750259131193161,
5
- "eval_runtime": 1.462,
6
- "eval_samples_per_second": 90.968,
7
- "eval_steps_per_second": 11.628,
8
- "train_loss": 0.0,
9
- "train_runtime": 0.0708,
10
- "train_samples_per_second": 72973.629,
11
- "train_steps_per_second": 9174.634
12
  }
 
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9849624060150376,
4
  "eval_loss": 0.08750259131193161,
5
+ "eval_runtime": 0.7758,
6
+ "eval_samples_per_second": 171.437,
7
+ "eval_steps_per_second": 21.913,
8
+ "train_loss": 0.23564630480913015,
9
+ "train_runtime": 101.4306,
10
+ "train_samples_per_second": 50.971,
11
+ "train_steps_per_second": 6.408
12
  }
eval_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9849624060150376,
4
  "eval_loss": 0.08750259131193161,
5
- "eval_runtime": 1.462,
6
- "eval_samples_per_second": 90.968,
7
- "eval_steps_per_second": 11.628
8
  }
 
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9849624060150376,
4
  "eval_loss": 0.08750259131193161,
5
+ "eval_runtime": 0.7758,
6
+ "eval_samples_per_second": 171.437,
7
+ "eval_steps_per_second": 21.913
8
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 5.0,
3
- "train_loss": 0.0,
4
- "train_runtime": 0.0708,
5
- "train_samples_per_second": 72973.629,
6
- "train_steps_per_second": 9174.634
7
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "train_loss": 0.23564630480913015,
4
+ "train_runtime": 101.4306,
5
+ "train_samples_per_second": 50.971,
6
+ "train_steps_per_second": 6.408
7
  }
trainer_state.json CHANGED
@@ -89,9 +89,9 @@
89
  "epoch": 1.0,
90
  "eval_accuracy": 0.9624060150375939,
91
  "eval_loss": 0.23068006336688995,
92
- "eval_runtime": 0.7684,
93
- "eval_samples_per_second": 173.093,
94
- "eval_steps_per_second": 22.125,
95
  "step": 130
96
  },
97
  {
@@ -176,9 +176,9 @@
176
  "epoch": 2.0,
177
  "eval_accuracy": 0.9924812030075187,
178
  "eval_loss": 0.11085593700408936,
179
- "eval_runtime": 0.7745,
180
- "eval_samples_per_second": 171.733,
181
- "eval_steps_per_second": 21.951,
182
  "step": 260
183
  },
184
  {
@@ -263,9 +263,9 @@
263
  "epoch": 3.0,
264
  "eval_accuracy": 0.9699248120300752,
265
  "eval_loss": 0.1108752116560936,
266
- "eval_runtime": 0.7607,
267
- "eval_samples_per_second": 174.831,
268
- "eval_steps_per_second": 22.347,
269
  "step": 390
270
  },
271
  {
@@ -350,9 +350,9 @@
350
  "epoch": 4.0,
351
  "eval_accuracy": 0.9849624060150376,
352
  "eval_loss": 0.08750259131193161,
353
- "eval_runtime": 0.7575,
354
- "eval_samples_per_second": 175.569,
355
- "eval_steps_per_second": 22.441,
356
  "step": 520
357
  },
358
  {
@@ -437,19 +437,19 @@
437
  "epoch": 5.0,
438
  "eval_accuracy": 0.9774436090225563,
439
  "eval_loss": 0.08863506466150284,
440
- "eval_runtime": 0.7631,
441
- "eval_samples_per_second": 174.294,
442
- "eval_steps_per_second": 22.278,
443
  "step": 650
444
  },
445
  {
446
  "epoch": 5.0,
447
  "step": 650,
448
  "total_flos": 4.006371770595533e+17,
449
- "train_loss": 0.0,
450
- "train_runtime": 0.0708,
451
- "train_samples_per_second": 72973.629,
452
- "train_steps_per_second": 9174.634
453
  }
454
  ],
455
  "max_steps": 650,
 
89
  "epoch": 1.0,
90
  "eval_accuracy": 0.9624060150375939,
91
  "eval_loss": 0.23068006336688995,
92
+ "eval_runtime": 0.7854,
93
+ "eval_samples_per_second": 169.35,
94
+ "eval_steps_per_second": 21.646,
95
  "step": 130
96
  },
97
  {
 
176
  "epoch": 2.0,
177
  "eval_accuracy": 0.9924812030075187,
178
  "eval_loss": 0.11085593700408936,
179
+ "eval_runtime": 0.7261,
180
+ "eval_samples_per_second": 183.181,
181
+ "eval_steps_per_second": 23.414,
182
  "step": 260
183
  },
184
  {
 
263
  "epoch": 3.0,
264
  "eval_accuracy": 0.9699248120300752,
265
  "eval_loss": 0.1108752116560936,
266
+ "eval_runtime": 0.7271,
267
+ "eval_samples_per_second": 182.92,
268
+ "eval_steps_per_second": 23.381,
269
  "step": 390
270
  },
271
  {
 
350
  "epoch": 4.0,
351
  "eval_accuracy": 0.9849624060150376,
352
  "eval_loss": 0.08750259131193161,
353
+ "eval_runtime": 0.7445,
354
+ "eval_samples_per_second": 178.634,
355
+ "eval_steps_per_second": 22.833,
356
  "step": 520
357
  },
358
  {
 
437
  "epoch": 5.0,
438
  "eval_accuracy": 0.9774436090225563,
439
  "eval_loss": 0.08863506466150284,
440
+ "eval_runtime": 0.7378,
441
+ "eval_samples_per_second": 180.271,
442
+ "eval_steps_per_second": 23.042,
443
  "step": 650
444
  },
445
  {
446
  "epoch": 5.0,
447
  "step": 650,
448
  "total_flos": 4.006371770595533e+17,
449
+ "train_loss": 0.23564630480913015,
450
+ "train_runtime": 101.4306,
451
+ "train_samples_per_second": 50.971,
452
+ "train_steps_per_second": 6.408
453
  }
454
  ],
455
  "max_steps": 650,