infinitejoy committed on
Commit
d7bdd33
1 Parent(s): 09eb23e

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "eval_loss": 0.7654190063476562,
4
+ "eval_runtime": 69.7723,
5
+ "eval_samples": 1716,
6
+ "eval_samples_per_second": 24.594,
7
+ "eval_steps_per_second": 0.774,
8
+ "eval_wer": 0.5185841828658266,
9
+ "train_loss": 3.4940547976286513,
10
+ "train_runtime": 2130.2547,
11
+ "train_samples": 3670,
12
+ "train_samples_per_second": 17.228,
13
+ "train_steps_per_second": 0.54
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "eval_loss": 0.7654190063476562,
4
+ "eval_runtime": 69.7723,
5
+ "eval_samples": 1716,
6
+ "eval_samples_per_second": 24.594,
7
+ "eval_steps_per_second": 0.774,
8
+ "eval_wer": 0.5185841828658266
9
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3221b9c28943b03d04aa88289fd364b0f078d534902800b84f78f85e820dcec
3
  size 1262104049
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23d23e377b908f06fea252ccbf8dbcbd6cc1f0217db94f725fb5f5a23cb45d41
3
  size 1262104049
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "train_loss": 3.4940547976286513,
4
+ "train_runtime": 2130.2547,
5
+ "train_samples": 3670,
6
+ "train_samples_per_second": 17.228,
7
+ "train_steps_per_second": 0.54
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,109 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 10.0,
5
+ "global_step": 1150,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.87,
12
+ "learning_rate": 1.68e-05,
13
+ "loss": 11.4306,
14
+ "step": 100
15
+ },
16
+ {
17
+ "epoch": 1.74,
18
+ "learning_rate": 3.4299999999999993e-05,
19
+ "loss": 4.3407,
20
+ "step": 200
21
+ },
22
+ {
23
+ "epoch": 2.61,
24
+ "learning_rate": 5.179999999999999e-05,
25
+ "loss": 3.2465,
26
+ "step": 300
27
+ },
28
+ {
29
+ "epoch": 3.48,
30
+ "learning_rate": 6.929999999999999e-05,
31
+ "loss": 3.0269,
32
+ "step": 400
33
+ },
34
+ {
35
+ "epoch": 3.48,
36
+ "eval_loss": 2.9771385192871094,
37
+ "eval_runtime": 71.2409,
38
+ "eval_samples_per_second": 24.087,
39
+ "eval_steps_per_second": 0.758,
40
+ "eval_wer": 1.0,
41
+ "step": 400
42
+ },
43
+ {
44
+ "epoch": 4.35,
45
+ "learning_rate": 6.104e-05,
46
+ "loss": 2.9973,
47
+ "step": 500
48
+ },
49
+ {
50
+ "epoch": 5.22,
51
+ "learning_rate": 5.1706666666666664e-05,
52
+ "loss": 2.9206,
53
+ "step": 600
54
+ },
55
+ {
56
+ "epoch": 6.09,
57
+ "learning_rate": 4.237333333333332e-05,
58
+ "loss": 2.8692,
59
+ "step": 700
60
+ },
61
+ {
62
+ "epoch": 6.96,
63
+ "learning_rate": 3.3039999999999995e-05,
64
+ "loss": 2.7902,
65
+ "step": 800
66
+ },
67
+ {
68
+ "epoch": 6.96,
69
+ "eval_loss": 2.4356915950775146,
70
+ "eval_runtime": 71.3351,
71
+ "eval_samples_per_second": 24.055,
72
+ "eval_steps_per_second": 0.757,
73
+ "eval_wer": 0.9988602545431521,
74
+ "step": 800
75
+ },
76
+ {
77
+ "epoch": 7.83,
78
+ "learning_rate": 2.3706666666666664e-05,
79
+ "loss": 2.3184,
80
+ "step": 900
81
+ },
82
+ {
83
+ "epoch": 8.7,
84
+ "learning_rate": 1.4373333333333332e-05,
85
+ "loss": 1.8236,
86
+ "step": 1000
87
+ },
88
+ {
89
+ "epoch": 9.57,
90
+ "learning_rate": 5.039999999999999e-06,
91
+ "loss": 1.6258,
92
+ "step": 1100
93
+ },
94
+ {
95
+ "epoch": 10.0,
96
+ "step": 1150,
97
+ "total_flos": 5.422401103281132e+18,
98
+ "train_loss": 3.4940547976286513,
99
+ "train_runtime": 2130.2547,
100
+ "train_samples_per_second": 17.228,
101
+ "train_steps_per_second": 0.54
102
+ }
103
+ ],
104
+ "max_steps": 1150,
105
+ "num_train_epochs": 10,
106
+ "total_flos": 5.422401103281132e+18,
107
+ "trial_name": null,
108
+ "trial_params": null
109
+ }