Mihaiii committed on
Commit
af94f9a
·
verified ·
1 Parent(s): 85d22d8

Upload 8 files

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "TaylorAI/gte-tiny",
3
  "architectures": [
4
  "BertModel"
5
  ],
@@ -17,7 +17,6 @@
17
  "num_hidden_layers": 6,
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
20
- "torch_dtype": "float32",
21
  "transformers_version": "4.40.1",
22
  "type_vocab_size": 2,
23
  "use_cache": true,
 
1
  {
2
+ "_name_or_path": "Mihaiii/jhjghjgh",
3
  "architectures": [
4
  "BertModel"
5
  ],
 
17
  "num_hidden_layers": 6,
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
 
20
  "transformers_version": "4.40.1",
21
  "type_vocab_size": 2,
22
  "use_cache": true,
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94991fb91626bd674ec552f4b5be605bfbe705cfb04251098faf10a076f23959
3
+ size 90387629
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ace3cc967f9ac881712ca14e0e290119285baf2114363dcc12a0836d1967790
3
+ size 22972868
quantize_config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Cast",
8
+ "Shape",
9
+ "Erf",
10
+ "Sub",
11
+ "Unsqueeze",
12
+ "Add",
13
+ "Sqrt",
14
+ "Concat",
15
+ "Gather",
16
+ "Slice",
17
+ "Softmax",
18
+ "Reshape",
19
+ "Constant",
20
+ "Div",
21
+ "Mul",
22
+ "ReduceMean",
23
+ "Transpose",
24
+ "MatMul",
25
+ "Pow"
26
+ ],
27
+ "weight_type": "QInt8"
28
+ }
29
+ }
30
+ }