maratos committed on
Commit
2b654f4
·
verified ·
1 Parent(s): f3b658e

Training in progress, step 5000

Browse files
Files changed (3) hide show
  1. config.json +15 -105
  2. model.safetensors +2 -2
  3. training_args.bin +2 -2
config.json CHANGED
@@ -8,29 +8,23 @@
8
  ],
9
  "attention_dropout": 0.0,
10
  "begin_suppress_tokens": [
11
- 220,
12
- 50256
13
  ],
14
- "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
  "d_model": 768,
17
  "decoder_attention_heads": 12,
18
  "decoder_ffn_dim": 3072,
19
  "decoder_layerdrop": 0.0,
20
  "decoder_layers": 12,
21
- "decoder_start_token_id": 50257,
22
  "dropout": 0.0,
23
  "encoder_attention_heads": 12,
24
  "encoder_ffn_dim": 3072,
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 12,
27
- "eos_token_id": 50256,
28
- "forced_decoder_ids": [
29
- [
30
- 1,
31
- 50362
32
- ]
33
- ],
34
  "init_std": 0.02,
35
  "is_encoder_decoder": true,
36
  "mask_feature_length": 10,
@@ -39,110 +33,26 @@
39
  "mask_time_length": 10,
40
  "mask_time_min_masks": 2,
41
  "mask_time_prob": 0.05,
42
- "max_length": 448,
43
  "max_source_positions": 1500,
44
- "max_target_positions": 448,
45
  "median_filter_width": 7,
46
  "model_type": "whisper",
47
  "num_hidden_layers": 12,
48
  "num_mel_bins": 80,
49
- "pad_token_id": 50256,
50
  "scale_embedding": false,
51
  "suppress_tokens": [
52
- 1,
53
- 2,
54
- 7,
55
- 8,
56
- 9,
57
- 10,
58
- 14,
59
- 25,
60
- 26,
61
- 27,
62
- 28,
63
- 29,
64
- 31,
65
- 58,
66
- 59,
67
- 60,
68
- 61,
69
- 62,
70
- 63,
71
- 90,
72
- 91,
73
- 92,
74
- 93,
75
- 357,
76
- 366,
77
- 438,
78
- 532,
79
- 685,
80
- 705,
81
- 796,
82
- 930,
83
- 1058,
84
- 1220,
85
- 1267,
86
- 1279,
87
- 1303,
88
- 1343,
89
- 1377,
90
- 1391,
91
- 1635,
92
- 1782,
93
- 1875,
94
- 2162,
95
- 2361,
96
- 2488,
97
- 3467,
98
- 4008,
99
- 4211,
100
- 4600,
101
- 4808,
102
- 5299,
103
- 5855,
104
- 6329,
105
- 7203,
106
- 9609,
107
- 9959,
108
- 10563,
109
- 10786,
110
- 11420,
111
- 11709,
112
- 11907,
113
- 13163,
114
- 13697,
115
- 13700,
116
- 14808,
117
- 15306,
118
- 16410,
119
- 16791,
120
- 17992,
121
- 19203,
122
- 19510,
123
- 20724,
124
- 22305,
125
- 22935,
126
- 27007,
127
- 30109,
128
- 30420,
129
- 33409,
130
- 34949,
131
- 40283,
132
- 40493,
133
- 40549,
134
- 47282,
135
- 49146,
136
- 50257,
137
- 50357,
138
- 50358,
139
- 50359,
140
- 50360,
141
- 50361
142
  ],
143
  "torch_dtype": "float32",
144
  "transformers_version": "4.42.3",
145
  "use_cache": true,
146
  "use_weighted_layer_sum": false,
147
- "vocab_size": 51864
148
  }
 
8
  ],
9
  "attention_dropout": 0.0,
10
  "begin_suppress_tokens": [
11
+ 1541
 
12
  ],
13
+ "bos_token_id": 1546,
14
  "classifier_proj_size": 256,
15
  "d_model": 768,
16
  "decoder_attention_heads": 12,
17
  "decoder_ffn_dim": 3072,
18
  "decoder_layerdrop": 0.0,
19
  "decoder_layers": 12,
20
+ "decoder_start_token_id": 1546,
21
  "dropout": 0.0,
22
  "encoder_attention_heads": 12,
23
  "encoder_ffn_dim": 3072,
24
  "encoder_layerdrop": 0.0,
25
  "encoder_layers": 12,
26
+ "eos_token_id": 1541,
27
+ "forced_decoder_ids": null,
 
 
 
 
 
28
  "init_std": 0.02,
29
  "is_encoder_decoder": true,
30
  "mask_feature_length": 10,
 
33
  "mask_time_length": 10,
34
  "mask_time_min_masks": 2,
35
  "mask_time_prob": 0.05,
36
+ "max_length": 512,
37
  "max_source_positions": 1500,
38
+ "max_target_positions": 512,
39
  "median_filter_width": 7,
40
  "model_type": "whisper",
41
  "num_hidden_layers": 12,
42
  "num_mel_bins": 80,
43
+ "pad_token_id": 1541,
44
  "scale_embedding": false,
45
  "suppress_tokens": [
46
+ 1546,
47
+ 1548,
48
+ 1547,
49
+ 1544,
50
+ 1545,
51
+ 1542
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52
  ],
53
  "torch_dtype": "float32",
54
  "transformers_version": "4.42.3",
55
  "use_cache": true,
56
  "use_weighted_layer_sum": false,
57
+ "vocab_size": 1549
58
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0b76a193d39659f946f662f382749c4194d6a381254920bade93f28997b7e89
3
- size 966992008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d9a87bb0f09b681ca1446cfaa48550f6dbe3f199713c54736e4a8cc364c1036
3
+ size 817182816
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a37eaafbf60fec9f78060f0e8a52b0d5fdc4856683fc7cd8d4eade1b027dc09
3
- size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ce83fe46fdd2f27622c268af045ebf91760763f77aa934b399fe0067407b292
3
+ size 7480