steerapi committed on
Commit
14fcf70
1 Parent(s): 7b8493c

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -40,3 +40,4 @@ Constant_170_attr__value filter=lfs diff=lfs merge=lfs -text
40
  onnx/decoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
41
  onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
42
  onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
40
  onnx/decoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
41
  onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
42
  onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
43
+ onnx/decoder_model_merged_quantized.onnx.data filter=lfs diff=lfs merge=lfs -text
onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:390640ee46632eb998ed966347c2f6acfddad5ea04aad9e7f9e528d241dacf0c
3
+ size 19045741
onnx/decoder_model_merged_quantized.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d312201a36ec7d97cac2fc87c664ef0ec16a681f55ec013b9e3ce383904411e4
3
+ size 6739214336
onnx/quantize_config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "use_external_data_format": true,
5
+ "per_model_config": {
6
+ "decoder_model_merged": {
7
+ "op_types": [
8
+ "Cast",
9
+ "Sigmoid",
10
+ "If",
11
+ "Shape",
12
+ "Gather",
13
+ "Squeeze",
14
+ "Pow",
15
+ "Sub",
16
+ "Identity",
17
+ "Unsqueeze",
18
+ "MatMul",
19
+ "ReduceMean",
20
+ "Constant",
21
+ "Equal",
22
+ "Sqrt",
23
+ "Expand",
24
+ "Add",
25
+ "Range",
26
+ "Less",
27
+ "Div",
28
+ "ConstantOfShape",
29
+ "Where",
30
+ "Transpose",
31
+ "Mul",
32
+ "Slice",
33
+ "Softmax",
34
+ "Neg",
35
+ "Concat",
36
+ "Reshape"
37
+ ],
38
+ "weight_type": "QInt8"
39
+ }
40
+ }
41
+ }