vikas85 committed on
Commit
d3f9d3f
1 Parent(s): 9229a20

Upload 8 files

Browse files
config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "openai/whisper-large-v2",
3
+ "activation_dropout": 0.0,
4
+ "activation_function": "gelu",
5
+ "apply_spec_augment": false,
6
+ "architectures": [
7
+ "WhisperForConditionalGeneration"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "begin_suppress_tokens": [
11
+ 220,
12
+ 50257
13
+ ],
14
+ "bos_token_id": 50257,
15
+ "classifier_proj_size": 256,
16
+ "d_model": 1280,
17
+ "decoder_attention_heads": 20,
18
+ "decoder_ffn_dim": 5120,
19
+ "decoder_layerdrop": 0.0,
20
+ "decoder_layers": 32,
21
+ "decoder_start_token_id": 50258,
22
+ "dropout": 0.05,
23
+ "encoder_attention_heads": 20,
24
+ "encoder_ffn_dim": 5120,
25
+ "encoder_layerdrop": 0.0,
26
+ "encoder_layers": 32,
27
+ "eos_token_id": 50257,
28
+ "forced_decoder_ids": [
29
+ [
30
+ 1,
31
+ 50278
32
+ ],
33
+ [
34
+ 2,
35
+ 50359
36
+ ],
37
+ [
38
+ 3,
39
+ 50363
40
+ ]
41
+ ],
42
+ "init_std": 0.02,
43
+ "is_encoder_decoder": true,
44
+ "mask_feature_length": 10,
45
+ "mask_feature_min_masks": 0,
46
+ "mask_feature_prob": 0.0,
47
+ "mask_time_length": 10,
48
+ "mask_time_min_masks": 2,
49
+ "mask_time_prob": 0.05,
50
+ "max_length": 448,
51
+ "max_source_positions": 1500,
52
+ "max_target_positions": 448,
53
+ "model_type": "whisper",
54
+ "num_hidden_layers": 32,
55
+ "num_mel_bins": 80,
56
+ "pad_token_id": 50257,
57
+ "scale_embedding": false,
58
+ "suppress_tokens": [],
59
+ "torch_dtype": "float32",
60
+ "transformers_version": "4.29.2",
61
+ "use_cache": false,
62
+ "use_weighted_layer_sum": false,
63
+ "vocab_size": 51865
64
+ }
generation_config.json ADDED
@@ -0,0 +1,225 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "begin_suppress_tokens": [
3
+ 220,
4
+ 50257
5
+ ],
6
+ "bos_token_id": 50257,
7
+ "decoder_start_token_id": 50258,
8
+ "eos_token_id": 50257,
9
+ "forced_decoder_ids": [
10
+ [
11
+ 1,
12
+ 50278
13
+ ],
14
+ [
15
+ 2,
16
+ 50359
17
+ ],
18
+ [
19
+ 3,
20
+ 50363
21
+ ]
22
+ ],
23
+ "is_multilingual": true,
24
+ "lang_to_id": {
25
+ "<|af|>": 50327,
26
+ "<|am|>": 50334,
27
+ "<|ar|>": 50272,
28
+ "<|as|>": 50350,
29
+ "<|az|>": 50304,
30
+ "<|ba|>": 50355,
31
+ "<|be|>": 50330,
32
+ "<|bg|>": 50292,
33
+ "<|bn|>": 50302,
34
+ "<|bo|>": 50347,
35
+ "<|br|>": 50309,
36
+ "<|bs|>": 50315,
37
+ "<|ca|>": 50270,
38
+ "<|cs|>": 50283,
39
+ "<|cy|>": 50297,
40
+ "<|da|>": 50285,
41
+ "<|de|>": 50261,
42
+ "<|el|>": 50281,
43
+ "<|en|>": 50259,
44
+ "<|es|>": 50262,
45
+ "<|et|>": 50307,
46
+ "<|eu|>": 50310,
47
+ "<|fa|>": 50300,
48
+ "<|fi|>": 50277,
49
+ "<|fo|>": 50338,
50
+ "<|fr|>": 50265,
51
+ "<|gl|>": 50319,
52
+ "<|gu|>": 50333,
53
+ "<|haw|>": 50352,
54
+ "<|ha|>": 50354,
55
+ "<|he|>": 50279,
56
+ "<|hi|>": 50276,
57
+ "<|hr|>": 50291,
58
+ "<|ht|>": 50339,
59
+ "<|hu|>": 50286,
60
+ "<|hy|>": 50312,
61
+ "<|id|>": 50275,
62
+ "<|is|>": 50311,
63
+ "<|it|>": 50274,
64
+ "<|ja|>": 50266,
65
+ "<|jw|>": 50356,
66
+ "<|ka|>": 50329,
67
+ "<|kk|>": 50316,
68
+ "<|km|>": 50323,
69
+ "<|kn|>": 50306,
70
+ "<|ko|>": 50264,
71
+ "<|la|>": 50294,
72
+ "<|lb|>": 50345,
73
+ "<|ln|>": 50353,
74
+ "<|lo|>": 50336,
75
+ "<|lt|>": 50293,
76
+ "<|lv|>": 50301,
77
+ "<|mg|>": 50349,
78
+ "<|mi|>": 50295,
79
+ "<|mk|>": 50308,
80
+ "<|ml|>": 50296,
81
+ "<|mn|>": 50314,
82
+ "<|mr|>": 50320,
83
+ "<|ms|>": 50282,
84
+ "<|mt|>": 50343,
85
+ "<|my|>": 50346,
86
+ "<|ne|>": 50313,
87
+ "<|nl|>": 50271,
88
+ "<|nn|>": 50342,
89
+ "<|no|>": 50288,
90
+ "<|oc|>": 50328,
91
+ "<|pa|>": 50321,
92
+ "<|pl|>": 50269,
93
+ "<|ps|>": 50340,
94
+ "<|pt|>": 50267,
95
+ "<|ro|>": 50284,
96
+ "<|ru|>": 50263,
97
+ "<|sa|>": 50344,
98
+ "<|sd|>": 50332,
99
+ "<|si|>": 50322,
100
+ "<|sk|>": 50298,
101
+ "<|sl|>": 50305,
102
+ "<|sn|>": 50324,
103
+ "<|so|>": 50326,
104
+ "<|sq|>": 50317,
105
+ "<|sr|>": 50303,
106
+ "<|su|>": 50357,
107
+ "<|sv|>": 50273,
108
+ "<|sw|>": 50318,
109
+ "<|ta|>": 50287,
110
+ "<|te|>": 50299,
111
+ "<|tg|>": 50331,
112
+ "<|th|>": 50289,
113
+ "<|tk|>": 50341,
114
+ "<|tl|>": 50348,
115
+ "<|tr|>": 50268,
116
+ "<|tt|>": 50351,
117
+ "<|uk|>": 50280,
118
+ "<|ur|>": 50290,
119
+ "<|uz|>": 50337,
120
+ "<|vi|>": 50278,
121
+ "<|yi|>": 50335,
122
+ "<|yo|>": 50325,
123
+ "<|zh|>": 50260
124
+ },
125
+ "max_initial_timestamp_index": 1,
126
+ "max_length": 448,
127
+ "no_timestamps_token_id": 50363,
128
+ "pad_token_id": 50257,
129
+ "return_timestamps": false,
130
+ "suppress_tokens": [
131
+ 1,
132
+ 2,
133
+ 7,
134
+ 8,
135
+ 9,
136
+ 10,
137
+ 14,
138
+ 25,
139
+ 26,
140
+ 27,
141
+ 28,
142
+ 29,
143
+ 31,
144
+ 58,
145
+ 59,
146
+ 60,
147
+ 61,
148
+ 62,
149
+ 63,
150
+ 90,
151
+ 91,
152
+ 92,
153
+ 93,
154
+ 359,
155
+ 503,
156
+ 522,
157
+ 542,
158
+ 873,
159
+ 893,
160
+ 902,
161
+ 918,
162
+ 922,
163
+ 931,
164
+ 1350,
165
+ 1853,
166
+ 1982,
167
+ 2460,
168
+ 2627,
169
+ 3246,
170
+ 3253,
171
+ 3268,
172
+ 3536,
173
+ 3846,
174
+ 3961,
175
+ 4183,
176
+ 4667,
177
+ 6585,
178
+ 6647,
179
+ 7273,
180
+ 9061,
181
+ 9383,
182
+ 10428,
183
+ 10929,
184
+ 11938,
185
+ 12033,
186
+ 12331,
187
+ 12562,
188
+ 13793,
189
+ 14157,
190
+ 14635,
191
+ 15265,
192
+ 15618,
193
+ 16553,
194
+ 16604,
195
+ 18362,
196
+ 18956,
197
+ 20075,
198
+ 21675,
199
+ 22520,
200
+ 26130,
201
+ 26161,
202
+ 26435,
203
+ 28279,
204
+ 29464,
205
+ 31650,
206
+ 32302,
207
+ 32470,
208
+ 36865,
209
+ 42863,
210
+ 47425,
211
+ 49870,
212
+ 50254,
213
+ 50258,
214
+ 50358,
215
+ 50359,
216
+ 50360,
217
+ 50361,
218
+ 50362
219
+ ],
220
+ "task_to_id": {
221
+ "transcribe": 50359,
222
+ "translate": 50358
223
+ },
224
+ "transformers_version": "4.29.2"
225
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "chunk_length": 30,
3
+ "feature_extractor_type": "WhisperFeatureExtractor",
4
+ "feature_size": 80,
5
+ "hop_length": 160,
6
+ "n_fft": 400,
7
+ "n_samples": 480000,
8
+ "nb_max_frames": 3000,
9
+ "padding_side": "right",
10
+ "padding_value": 0.0,
11
+ "processor_class": "WhisperProcessor",
12
+ "return_attention_mask": false,
13
+ "sampling_rate": 16000
14
+ }
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09a8eb5cc45a902bad3e1a3e996ccde99bcc71081840ac04743908052048448e
3
+ size 14511
scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a5136c4f35721045adb593132aabc63996fa4620f6d3e839ea96787517b6016
3
+ size 557
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a591c4c5570b9a8471ab6140641b9dc0b4e17512da7bd0c767a4ad2d7ef6083c
3
+ size 627
trainer_state.json ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.16838560303094086,
3
+ "best_model_checkpoint": "./whisper-all\\checkpoint-10500",
4
+ "epoch": 5.839822024471635,
5
+ "global_step": 10500,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.28,
12
+ "learning_rate": 9.721382697393274e-07,
13
+ "loss": 0.9517,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 0.28,
18
+ "eval_loss": 0.23364929854869843,
19
+ "eval_runtime": 2055.8229,
20
+ "eval_samples_per_second": 1.388,
21
+ "eval_steps_per_second": 0.174,
22
+ "eval_wer": 12.261746065155874,
23
+ "step": 500
24
+ },
25
+ {
26
+ "epoch": 0.56,
27
+ "learning_rate": 9.249149981110691e-07,
28
+ "loss": 0.4857,
29
+ "step": 1000
30
+ },
31
+ {
32
+ "epoch": 0.56,
33
+ "eval_loss": 0.19377797842025757,
34
+ "eval_runtime": 2058.47,
35
+ "eval_samples_per_second": 1.386,
36
+ "eval_steps_per_second": 0.173,
37
+ "eval_wer": 10.500713300123952,
38
+ "step": 1000
39
+ },
40
+ {
41
+ "epoch": 0.83,
42
+ "learning_rate": 8.777861730260671e-07,
43
+ "loss": 0.4437,
44
+ "step": 1500
45
+ },
46
+ {
47
+ "epoch": 0.83,
48
+ "eval_loss": 0.15837284922599792,
49
+ "eval_runtime": 2059.2478,
50
+ "eval_samples_per_second": 1.386,
51
+ "eval_steps_per_second": 0.173,
52
+ "eval_wer": 8.982904183914497,
53
+ "step": 1500
54
+ },
55
+ {
56
+ "epoch": 1.11,
57
+ "learning_rate": 8.305629013978088e-07,
58
+ "loss": 0.3544,
59
+ "step": 2000
60
+ },
61
+ {
62
+ "epoch": 1.11,
63
+ "eval_loss": 0.1296420842409134,
64
+ "eval_runtime": 2050.2346,
65
+ "eval_samples_per_second": 1.392,
66
+ "eval_steps_per_second": 0.174,
67
+ "eval_wer": 7.067517949437545,
68
+ "step": 2000
69
+ },
70
+ {
71
+ "epoch": 1.39,
72
+ "learning_rate": 7.833396297695503e-07,
73
+ "loss": 0.2743,
74
+ "step": 2500
75
+ },
76
+ {
77
+ "epoch": 1.39,
78
+ "eval_loss": 0.10552296042442322,
79
+ "eval_runtime": 2046.8577,
80
+ "eval_samples_per_second": 1.394,
81
+ "eval_steps_per_second": 0.174,
82
+ "eval_wer": 6.368249959072944,
83
+ "step": 2500
84
+ },
85
+ {
86
+ "epoch": 1.67,
87
+ "learning_rate": 7.362108046845486e-07,
88
+ "loss": 0.2819,
89
+ "step": 3000
90
+ },
91
+ {
92
+ "epoch": 1.67,
93
+ "eval_loss": 0.08085598796606064,
94
+ "eval_runtime": 2023.4637,
95
+ "eval_samples_per_second": 1.41,
96
+ "eval_steps_per_second": 0.176,
97
+ "eval_wer": 4.448186346734021,
98
+ "step": 3000
99
+ },
100
+ {
101
+ "epoch": 1.95,
102
+ "learning_rate": 6.889875330562901e-07,
103
+ "loss": 0.2629,
104
+ "step": 3500
105
+ },
106
+ {
107
+ "epoch": 1.95,
108
+ "eval_loss": 0.06196921318769455,
109
+ "eval_runtime": 2016.6651,
110
+ "eval_samples_per_second": 1.415,
111
+ "eval_steps_per_second": 0.177,
112
+ "eval_wer": 3.309244837344185,
113
+ "step": 3500
114
+ },
115
+ {
116
+ "epoch": 2.22,
117
+ "learning_rate": 6.417642614280318e-07,
118
+ "loss": 0.166,
119
+ "step": 4000
120
+ },
121
+ {
122
+ "epoch": 2.22,
123
+ "eval_loss": 0.049665648490190506,
124
+ "eval_runtime": 2026.4551,
125
+ "eval_samples_per_second": 1.408,
126
+ "eval_steps_per_second": 0.176,
127
+ "eval_wer": 2.70586309314998,
128
+ "step": 4000
129
+ },
130
+ {
131
+ "epoch": 2.5,
132
+ "learning_rate": 5.945409897997733e-07,
133
+ "loss": 0.1443,
134
+ "step": 4500
135
+ },
136
+ {
137
+ "epoch": 2.5,
138
+ "eval_loss": 0.043939754366874695,
139
+ "eval_runtime": 3073.8688,
140
+ "eval_samples_per_second": 0.928,
141
+ "eval_steps_per_second": 0.116,
142
+ "eval_wer": 2.4345751771556867,
143
+ "step": 4500
144
+ },
145
+ {
146
+ "epoch": 2.78,
147
+ "learning_rate": 5.47317718171515e-07,
148
+ "loss": 0.1403,
149
+ "step": 5000
150
+ },
151
+ {
152
+ "epoch": 2.78,
153
+ "eval_loss": 0.03313903510570526,
154
+ "eval_runtime": 2041.5077,
155
+ "eval_samples_per_second": 1.398,
156
+ "eval_steps_per_second": 0.175,
157
+ "eval_wer": 1.725952431067144,
158
+ "step": 5000
159
+ },
160
+ {
161
+ "epoch": 3.06,
162
+ "learning_rate": 5.000944465432565e-07,
163
+ "loss": 0.1229,
164
+ "step": 5500
165
+ },
166
+ {
167
+ "epoch": 3.06,
168
+ "eval_loss": 0.025085289031267166,
169
+ "eval_runtime": 2036.5578,
170
+ "eval_samples_per_second": 1.401,
171
+ "eval_steps_per_second": 0.175,
172
+ "eval_wer": 1.2979723566968357,
173
+ "step": 5500
174
+ },
175
+ {
176
+ "epoch": 3.34,
177
+ "learning_rate": 4.528711749149981e-07,
178
+ "loss": 0.0666,
179
+ "step": 6000
180
+ },
181
+ {
182
+ "epoch": 3.34,
183
+ "eval_loss": 0.02561613917350769,
184
+ "eval_runtime": 2036.521,
185
+ "eval_samples_per_second": 1.401,
186
+ "eval_steps_per_second": 0.175,
187
+ "eval_wer": 1.4336163146939827,
188
+ "step": 6000
189
+ },
190
+ {
191
+ "epoch": 3.62,
192
+ "learning_rate": 4.056479032867397e-07,
193
+ "loss": 0.0681,
194
+ "step": 6500
195
+ },
196
+ {
197
+ "epoch": 3.62,
198
+ "eval_loss": 0.018902545794844627,
199
+ "eval_runtime": 2042.0741,
200
+ "eval_samples_per_second": 1.398,
201
+ "eval_steps_per_second": 0.175,
202
+ "eval_wer": 1.0687808414602773,
203
+ "step": 6500
204
+ },
205
+ {
206
+ "epoch": 3.89,
207
+ "learning_rate": 3.584246316584813e-07,
208
+ "loss": 0.063,
209
+ "step": 7000
210
+ },
211
+ {
212
+ "epoch": 3.89,
213
+ "eval_loss": 0.011477218009531498,
214
+ "eval_runtime": 2040.8765,
215
+ "eval_samples_per_second": 1.398,
216
+ "eval_steps_per_second": 0.175,
217
+ "eval_wer": 0.8068476811899249,
218
+ "step": 7000
219
+ },
220
+ {
221
+ "epoch": 4.17,
222
+ "learning_rate": 3.112013600302229e-07,
223
+ "loss": 0.0427,
224
+ "step": 7500
225
+ },
226
+ {
227
+ "epoch": 4.17,
228
+ "eval_loss": 0.010536368936300278,
229
+ "eval_runtime": 2038.2156,
230
+ "eval_samples_per_second": 1.4,
231
+ "eval_steps_per_second": 0.175,
232
+ "eval_wer": 0.47943123085198436,
233
+ "step": 7500
234
+ },
235
+ {
236
+ "epoch": 4.45,
237
+ "learning_rate": 2.6397808840196447e-07,
238
+ "loss": 0.0277,
239
+ "step": 8000
240
+ },
241
+ {
242
+ "epoch": 4.45,
243
+ "eval_loss": 0.009207101538777351,
244
+ "eval_runtime": 2049.3201,
245
+ "eval_samples_per_second": 1.393,
246
+ "eval_steps_per_second": 0.174,
247
+ "eval_wer": 0.4817699197829697,
248
+ "step": 8000
249
+ },
250
+ {
251
+ "epoch": 4.73,
252
+ "learning_rate": 2.1675481677370608e-07,
253
+ "loss": 0.0289,
254
+ "step": 8500
255
+ },
256
+ {
257
+ "epoch": 4.73,
258
+ "eval_loss": 0.007379856426268816,
259
+ "eval_runtime": 2045.1755,
260
+ "eval_samples_per_second": 1.395,
261
+ "eval_steps_per_second": 0.175,
262
+ "eval_wer": 0.35314202857877874,
263
+ "step": 8500
264
+ },
265
+ {
266
+ "epoch": 5.01,
267
+ "learning_rate": 1.6953154514544768e-07,
268
+ "loss": 0.0253,
269
+ "step": 9000
270
+ },
271
+ {
272
+ "epoch": 5.01,
273
+ "eval_loss": 0.005186205264180899,
274
+ "eval_runtime": 2053.6472,
275
+ "eval_samples_per_second": 1.39,
276
+ "eval_steps_per_second": 0.174,
277
+ "eval_wer": 0.21282069271966134,
278
+ "step": 9000
279
+ },
280
+ {
281
+ "epoch": 5.28,
282
+ "learning_rate": 1.2230827351718926e-07,
283
+ "loss": 0.0133,
284
+ "step": 9500
285
+ },
286
+ {
287
+ "epoch": 5.28,
288
+ "eval_loss": 0.005096600856631994,
289
+ "eval_runtime": 2024.6952,
290
+ "eval_samples_per_second": 1.41,
291
+ "eval_steps_per_second": 0.176,
292
+ "eval_wer": 0.2268528263055731,
293
+ "step": 9500
294
+ },
295
+ {
296
+ "epoch": 5.56,
297
+ "learning_rate": 7.508500188893087e-08,
298
+ "loss": 0.0118,
299
+ "step": 10000
300
+ },
301
+ {
302
+ "epoch": 5.56,
303
+ "eval_loss": 0.004013683646917343,
304
+ "eval_runtime": 2018.9797,
305
+ "eval_samples_per_second": 1.414,
306
+ "eval_steps_per_second": 0.177,
307
+ "eval_wer": 0.1800790476858673,
308
+ "step": 10000
309
+ },
310
+ {
311
+ "epoch": 5.84,
312
+ "learning_rate": 2.786173026067246e-08,
313
+ "loss": 0.0095,
314
+ "step": 10500
315
+ },
316
+ {
317
+ "epoch": 5.84,
318
+ "eval_loss": 0.0037340286653488874,
319
+ "eval_runtime": 2042.3697,
320
+ "eval_samples_per_second": 1.397,
321
+ "eval_steps_per_second": 0.175,
322
+ "eval_wer": 0.16838560303094086,
323
+ "step": 10500
324
+ }
325
+ ],
326
+ "max_steps": 10788,
327
+ "num_train_epochs": 6,
328
+ "total_flos": 3.566927314944e+20,
329
+ "trial_name": null,
330
+ "trial_params": null
331
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa6e60a1ca81793b9425bb141964ab895b5de26ac69a29fcba585b046bc5d899
3
+ size 4091