Upload folder using huggingface_hub

Browse files

Files changed (12) hide show

config.json +2 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
onnx/encoder_model.onnx +1 -1
onnx/encoder_model_quantized.onnx +2 -2
quantize_config.json +139 -0
tokenizer_config.json +1 -0

config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "architectures": [
     "MT5ForConditionalGeneration"
   ],
   "d_ff": 2048,
   "d_kv": 64,
   "d_model": 768,
@@ -25,7 +26,7 @@
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
   "tokenizer_class": "T5Tokenizer",
-  "transformers_version": "4.28.1",
   "use_cache": true,
   "vocab_size": 250112
 }

   "architectures": [
     "MT5ForConditionalGeneration"
   ],
+  "classifier_dropout": 0.0,
   "d_ff": 2048,
   "d_kv": 64,
   "d_model": 768,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
   "tokenizer_class": "T5Tokenizer",
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 250112
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
-  "transformers_version": "4.28.1"
 }

   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:446c4420b33340663588efa44f4edd9a80cd52efb7605afe7d198e3667027b27
-size 1990142970

 version https://git-lfs.github.com/spec/v1
+oid sha256:c48668239d5c97066b00a0dd7c78d618f45ba9e1911daced0ad2cc9a5c915783
+size 1990142661

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a30cc06a6ada3c522caeb065280348eadadda31e7e94db38feb792a6eae83763
-size 1990477278

 version https://git-lfs.github.com/spec/v1
+oid sha256:4823de9d05f2cdcf8743e29f9b7d72f5374d6899a6240144a53c48009d90a0ef
+size 1990476587

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a5ad041f1f348d8654671e0e88f119f00fd38dec9c5de8719538ed13ce64927
-size 498742113

 version https://git-lfs.github.com/spec/v1
+oid sha256:c456eabc1724752ff14267e84f6d3b7b5e7757873cf6ae82c916a49ccc4efce0
+size 500652976

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7cc5d67b457cb18a5b59361839f9ae9185ac120693d97f1370e436645a80e20d
-size 498165142

 version https://git-lfs.github.com/spec/v1
+oid sha256:07cde49811938805c3e59fc87608aba75c408a2d9a4827e73e5fe33b87057911
+size 500076462

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:edb08cc4d61361168917ce3d099ba53546e7097ddf465fa0bfeb0eedd7ba356c
-size 1933491316

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed18f6622a1c609c54ba3850ff93a39574192733469eaa143d799244007ad0cd
+size 1933491009

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b9b489c732aae00276bf020389d4abdaecf00d4f58019e035ecffc5667541aba
-size 483948445

 version https://git-lfs.github.com/spec/v1
+oid sha256:eb11ef4ba08e9ed766c1f0ffdc468fa8666da08b6e01a4be337555eae769bd5b
+size 485767496

onnx/encoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0c9d15e3a303f7059a0ddb3e5af4ebaf74343f7c0f81fd9de174f5666c07df0c
 size 1108344238

 version https://git-lfs.github.com/spec/v1
+oid sha256:76b26f34b6bd3834064d5ac9b6ac2695367b6db43816b9ffea3ccb2938d6552c
 size 1108344238

onnx/encoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dccaebf4dec740d215e310dc7dc86540fcc0ced03d2a64fb7aff96b4a42b7f91
-size 277437491

 version https://git-lfs.github.com/spec/v1
+oid sha256:96011ec0b2e27757156d4d2d933b74a317d59558b6415387834fca9eab516a7d
+size 277914071

quantize_config.json ADDED Viewed

	@@ -0,0 +1,139 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Gather",
+                "Where",
+                "Concat",
+                "Tanh",
+                "Min",
+                "Tile",
+                "Cast",
+                "Shape",
+                "Pow",
+                "Log",
+                "Mul",
+                "Sqrt",
+                "Less",
+                "Softmax",
+                "Range",
+                "MatMul",
+                "Add",
+                "Transpose",
+                "Reshape",
+                "ConstantOfShape",
+                "LessOrEqual",
+                "ReduceMean",
+                "Expand",
+                "Sub",
+                "Unsqueeze",
+                "Constant",
+                "Div",
+                "Neg"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Gather",
+                "Where",
+                "Concat",
+                "Tanh",
+                "Min",
+                "Cast",
+                "Shape",
+                "Pow",
+                "Greater",
+                "Log",
+                "Mul",
+                "Sqrt",
+                "Less",
+                "Softmax",
+                "Range",
+                "MatMul",
+                "Add",
+                "Transpose",
+                "Reshape",
+                "ConstantOfShape",
+                "ReduceMean",
+                "Sub",
+                "Abs",
+                "Unsqueeze",
+                "Constant",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Gather",
+                "Where",
+                "Concat",
+                "Tanh",
+                "Min",
+                "Tile",
+                "Cast",
+                "Shape",
+                "Pow",
+                "Log",
+                "Mul",
+                "Sqrt",
+                "Less",
+                "Softmax",
+                "Range",
+                "MatMul",
+                "Add",
+                "Transpose",
+                "Reshape",
+                "Slice",
+                "ConstantOfShape",
+                "If",
+                "LessOrEqual",
+                "ReduceMean",
+                "Expand",
+                "Sub",
+                "Unsqueeze",
+                "Constant",
+                "Div",
+                "Neg"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Gather",
+                "Where",
+                "Concat",
+                "Tanh",
+                "Min",
+                "Tile",
+                "Cast",
+                "Shape",
+                "Pow",
+                "Log",
+                "Mul",
+                "Sqrt",
+                "Less",
+                "Softmax",
+                "Range",
+                "MatMul",
+                "Add",
+                "Transpose",
+                "Reshape",
+                "Slice",
+                "ConstantOfShape",
+                "LessOrEqual",
+                "ReduceMean",
+                "Expand",
+                "Sub",
+                "Unsqueeze",
+                "Constant",
+                "Div",
+                "Neg"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}

tokenizer_config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 0,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},

   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 0,
+  "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},