Xenova HF staff committed on
Commit
ae48508
1 Parent(s): ff5bc38

Upload folder using huggingface_hub

Browse files
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6f57dadddd3dbff6d785fbd14a18cedc6ed38753638dc820e1eeb20cb672ba8
3
- size 118664208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7cede2839ab27809070c7f66e784b30d4a41b150f75011ff0f4f9edacfbcae5
3
+ size 118608081
onnx/decoder_model_merged_bnb4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1134495cde770610187883ebb0e049c9c4467a5979f64e382ee64c432825ddf1
3
- size 86234792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be57bc7ba26db094bbacd653858c0de7a897b101cca80bb2e4d1f271255b9245
3
+ size 86178668
onnx/decoder_model_merged_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72b8537d2500bbee0ad8518deab0c3526680f734dea14d22e05100a1d85d7cc0
3
- size 59565877
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33afab390ade9c1fdf3fb05ee6df52b540bdbf7162835e9d4a7e58d1f8a46108
3
+ size 59663763
onnx/decoder_model_merged_int8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef8d12d2e403fb06a77529c25d9882b3f383ec0607eda560f72b0a9dbf7997a0
3
- size 110358643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e34cff2a26247deccc743326982616a407e0a7c9d914e270e0d5d05744bb0f
3
+ size 30792224
onnx/decoder_model_merged_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8941dbc39544b5930ca3c317fc072fe2947fe3fbc46fddaf741ecc2324799c3
3
- size 86824080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b22be1c461f4ed461d18f4f14c9a1e44f547dfa682c68d69e3c15f439074adb
3
+ size 86767956
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef8d12d2e403fb06a77529c25d9882b3f383ec0607eda560f72b0a9dbf7997a0
3
- size 110358643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e34cff2a26247deccc743326982616a407e0a7c9d914e270e0d5d05744bb0f
3
+ size 30792224
onnx/decoder_model_merged_uint8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d6d76bf090cf1cff1ec019de26d9d30329288a613482341112aa7dfb2353fa1
3
- size 110358664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e39590dff9cbe8b5b8869490272481e69d3c8f3f9d788b2e2aaecd5e3c8911e9
3
+ size 30792254
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8944ec04111e040305cdb07ac97f50363024255bf0bdc67ab93ecb76645f31ae
3
- size 32894434
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24c4760519687529f8c0988534cc29a7b8985bb2c234ac561598ba0e9601e1e9
3
+ size 32915848
onnx/encoder_model_bnb4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a4b5391078304c8b62e3a73dfd8ac069511cbe0a8a30f2db4a06914a95e63a4
3
- size 8567893
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c08c37e2ac65abf410780bfa7af4647008abb3859dd2099b2985776129c926c
3
+ size 8589307
onnx/encoder_model_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83fb3aa52145a42351b6b8cc3f520895fcfd297bf960a017fe9e91dee9484e9b
3
- size 16477869
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9fdf5764b679a466a659158c179a9a46426c28a91483665a7f359447ed6799f
3
+ size 16534300
onnx/encoder_model_int8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbcb11fb083f3794f9422311fe2be56c2d91792e79674e241185aad01f1c5389
3
- size 10083654
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff4f55981684451f5eda146b178b565385ae3a811e6056cf476cee09caadc6c7
3
+ size 10140085
onnx/encoder_model_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3e90a0256c385b03e6436290ffbf48eeee0515aaac9b00224efb97f3aded463
3
- size 9010109
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dda4f0cfcc313e3bbbc3ee236f1f26907bcbc87a1a5c7e91f2b35b5218abb8b7
3
+ size 9031523
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbc40fd63079402b8e63aecd4a21bd5a52f00ff6524729bca022ea74961786aa
3
- size 10083667
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43ae7d83c47d4fc8f69c49d8b9383407e725f876a8286de8b1904371c5583c4b
3
+ size 10140098
onnx/encoder_model_uint8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbc40fd63079402b8e63aecd4a21bd5a52f00ff6524729bca022ea74961786aa
3
- size 10083667
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43ae7d83c47d4fc8f69c49d8b9383407e725f876a8286de8b1904371c5583c4b
3
+ size 10140098
quantize_config.json CHANGED
@@ -5,18 +5,23 @@
5
  "encoder_model": {
6
  "op_types": [
7
  "Add",
 
 
8
  "Conv",
9
  "Div",
10
  "Erf",
 
11
  "MatMul",
12
  "Mul",
13
  "Pow",
14
  "ReduceMean",
15
  "Reshape",
 
16
  "Softmax",
17
  "Sqrt",
18
  "Sub",
19
- "Transpose"
 
20
  ],
21
  "weight_type": "QUInt8"
22
  },
@@ -77,6 +82,7 @@
77
  "decoder_model_merged": {
78
  "op_types": [
79
  "Add",
 
80
  "Concat",
81
  "Constant",
82
  "ConstantOfShape",
@@ -114,18 +120,23 @@
114
  "encoder_model": {
115
  "op_types": [
116
  "Add",
 
 
117
  "Conv",
118
  "Div",
119
  "Erf",
 
120
  "MatMul",
121
  "Mul",
122
  "Pow",
123
  "ReduceMean",
124
  "Reshape",
 
125
  "Softmax",
126
  "Sqrt",
127
  "Sub",
128
- "Transpose"
 
129
  ],
130
  "weight_type": "QInt8"
131
  },
@@ -186,6 +197,7 @@
186
  "decoder_model_merged": {
187
  "op_types": [
188
  "Add",
 
189
  "Concat",
190
  "Constant",
191
  "ConstantOfShape",
@@ -223,18 +235,23 @@
223
  "encoder_model": {
224
  "op_types": [
225
  "Add",
 
 
226
  "Conv",
227
  "Div",
228
  "Erf",
 
229
  "MatMul",
230
  "Mul",
231
  "Pow",
232
  "ReduceMean",
233
  "Reshape",
 
234
  "Softmax",
235
  "Sqrt",
236
  "Sub",
237
- "Transpose"
 
238
  ],
239
  "weight_type": "QUInt8"
240
  },
@@ -295,6 +312,7 @@
295
  "decoder_model_merged": {
296
  "op_types": [
297
  "Add",
 
298
  "Concat",
299
  "Constant",
300
  "ConstantOfShape",
 
5
  "encoder_model": {
6
  "op_types": [
7
  "Add",
8
+ "Concat",
9
+ "Constant",
10
  "Conv",
11
  "Div",
12
  "Erf",
13
+ "Gather",
14
  "MatMul",
15
  "Mul",
16
  "Pow",
17
  "ReduceMean",
18
  "Reshape",
19
+ "Shape",
20
  "Softmax",
21
  "Sqrt",
22
  "Sub",
23
+ "Transpose",
24
+ "Unsqueeze"
25
  ],
26
  "weight_type": "QUInt8"
27
  },
 
82
  "decoder_model_merged": {
83
  "op_types": [
84
  "Add",
85
+ "Cast",
86
  "Concat",
87
  "Constant",
88
  "ConstantOfShape",
 
120
  "encoder_model": {
121
  "op_types": [
122
  "Add",
123
+ "Concat",
124
+ "Constant",
125
  "Conv",
126
  "Div",
127
  "Erf",
128
+ "Gather",
129
  "MatMul",
130
  "Mul",
131
  "Pow",
132
  "ReduceMean",
133
  "Reshape",
134
+ "Shape",
135
  "Softmax",
136
  "Sqrt",
137
  "Sub",
138
+ "Transpose",
139
+ "Unsqueeze"
140
  ],
141
  "weight_type": "QInt8"
142
  },
 
197
  "decoder_model_merged": {
198
  "op_types": [
199
  "Add",
200
+ "Cast",
201
  "Concat",
202
  "Constant",
203
  "ConstantOfShape",
 
235
  "encoder_model": {
236
  "op_types": [
237
  "Add",
238
+ "Concat",
239
+ "Constant",
240
  "Conv",
241
  "Div",
242
  "Erf",
243
+ "Gather",
244
  "MatMul",
245
  "Mul",
246
  "Pow",
247
  "ReduceMean",
248
  "Reshape",
249
+ "Shape",
250
  "Softmax",
251
  "Sqrt",
252
  "Sub",
253
+ "Transpose",
254
+ "Unsqueeze"
255
  ],
256
  "weight_type": "QUInt8"
257
  },
 
312
  "decoder_model_merged": {
313
  "op_types": [
314
  "Add",
315
+ "Cast",
316
  "Concat",
317
  "Constant",
318
  "ConstantOfShape",