Xenova HF staff committed on
Commit
0b62d66
1 Parent(s): 12868d2

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -26,7 +26,7 @@
26
  "num_memory_blocks": 0,
27
  "pad_token_id": 0,
28
  "position_embedding_type": "absolute",
29
- "transformers_version": "4.29.2",
30
  "type_vocab_size": 2,
31
  "vocab_size": 30000
32
  }
 
26
  "num_memory_blocks": 0,
27
  "pad_token_id": 0,
28
  "position_embedding_type": "absolute",
29
+ "transformers_version": "4.33.0.dev0",
30
  "type_vocab_size": 2,
31
  "vocab_size": 30000
32
  }
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:531ee3021dbd2dab6961615185c321e405beb1bc93a006503dd41726973d2021
3
- size 83301256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae56917c8df36bced2a7b197ead8006bf47d7f4c771c015badd55f877c6f1c26
3
+ size 67941384
onnx/model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b3851bd633c37472ce90602a98f0d5cefebf1f5c1537121924b39ffcf95ee71
3
- size 72328456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d422074eb8acca46b98bd4761ce4b4e14eab86d3fc87dcd7d4d7b3192f0efd34
3
+ size 68337949
quantize_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Sqrt",
8
+ "Constant",
9
+ "Reshape",
10
+ "Shape",
11
+ "Slice",
12
+ "Div",
13
+ "Cast",
14
+ "Sub",
15
+ "MatMul",
16
+ "Gather",
17
+ "Unsqueeze",
18
+ "Softmax",
19
+ "Pow",
20
+ "Transpose",
21
+ "Tanh",
22
+ "Concat",
23
+ "ReduceMean",
24
+ "Mul",
25
+ "Identity",
26
+ "Add"
27
+ ],
28
+ "weight_type": "QInt8"
29
+ }
30
+ }
31
+ }