Upload folder using huggingface_hub

Browse files

Files changed (12)

config.json +2 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
onnx/encoder_model.onnx +1 -1
onnx/encoder_model_quantized.onnx +2 -2
quantize_config.json +139 -0
tokenizer_config.json +1 -0

config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "architectures": [
     "T5ForConditionalGeneration"
   ],
   "d_ff": 2048,
   "d_kv": 64,
   "d_model": 768,
@@ -24,7 +25,7 @@
   "relative_attention_max_distance": 128,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
-  "transformers_version": "4.28.1",
   "use_cache": true,
   "vocab_size": 32128
 }

   "architectures": [
     "T5ForConditionalGeneration"
   ],
+  "classifier_dropout": 0.0,
   "d_ff": 2048,
   "d_kv": 64,
   "d_model": 768,
   "relative_attention_max_distance": 128,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 32128
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
-  "transformers_version": "4.28.1"
 }

   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9e72639642edf8be9aed8fa37f41fcbc875b05298d8085e69a66c882a0d0ccd1
-size 650849270

 version https://git-lfs.github.com/spec/v1
+oid sha256:5a04194eb823d83980b9a406346af6accddbfc9ab85068918498253423441f60
+size 650848961

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:091b7fbfce64167d1d12f7a93715d70b7fb1f6adbeb909d04db8fd1855a023b4
-size 651183578

 version https://git-lfs.github.com/spec/v1
+oid sha256:53c515e3977d335e82d140c9521ec34a4ab46286600333cd78b1e60093644d50
+size 651182887

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:834f06b3f58cf5f0e80bc16e03da2993de8bb5e838510abf2bacd280f914177f
-size 163918689

 version https://git-lfs.github.com/spec/v1
+oid sha256:5e5c778efa9cb15f68a18c125443bd38f521c0f3553949599fe145acf437822d
+size 164739632

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:73d2f7413a9448d393d15f14b903da496beb31e08cc386818d4eb99e5cd464e7
-size 163341718

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6efcc9a424d07d7e8fd9075bd3c4fb7ea558d608ebf428d4092629d6c784dc3
+size 164163118

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:16e4d5ed1d92934fb3edbd52fccc670da129e27a4d0ae4f2bd2d6227f4aab146
-size 594197616

 version https://git-lfs.github.com/spec/v1
+oid sha256:f4c9d69c4f46e247fbb09b774ed9743a997ad073f13fde1714fa629acfa54d2a
+size 594197309

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:606fcbbea4b79e5c0438859263f1cf2ac236b457039f2892c5901c70bf387b0c
-size 149125021

 version https://git-lfs.github.com/spec/v1
+oid sha256:7fe68a8380083fba399d7983a502d55413315f96c4a45d2f14636c6ddbc8fe72
+size 149854152

onnx/encoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fe3834d4b309ae61774d82839e49e48b2963ec33a484758503bfb5ff8df56fe3
 size 438697388

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c1a769e5283d5ef269b1e8a29f8ba597758231cf82e307bf5fe1efa11681074
 size 438697388

onnx/encoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7aea036f67efffbeb338c918df641a38e5813443664abcc257c212ec9f51a1ca
-size 110025778

 version https://git-lfs.github.com/spec/v1
+oid sha256:3ac4080485da9d051127524c0e375adb109bdd5694a48c96b455b3015046d7bf
+size 110502358

quantize_config.json ADDED Viewed

@@ -0,0 +1,139 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Constant",
+                "Where",
+                "Tile",
+                "ConstantOfShape",
+                "Expand",
+                "MatMul",
+                "Unsqueeze",
+                "Range",
+                "Transpose",
+                "Tanh",
+                "ReduceMean",
+                "Cast",
+                "Sqrt",
+                "Add",
+                "Neg",
+                "Min",
+                "Log",
+                "Concat",
+                "Div",
+                "Softmax",
+                "Pow",
+                "Shape",
+                "Gather",
+                "Sub",
+                "LessOrEqual",
+                "Mul",
+                "Reshape",
+                "Less"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Constant",
+                "Where",
+                "ConstantOfShape",
+                "MatMul",
+                "Unsqueeze",
+                "Range",
+                "Transpose",
+                "Tanh",
+                "ReduceMean",
+                "Cast",
+                "Sqrt",
+                "Greater",
+                "Add",
+                "Abs",
+                "Min",
+                "Log",
+                "Concat",
+                "Div",
+                "Softmax",
+                "Pow",
+                "Shape",
+                "Gather",
+                "Sub",
+                "Mul",
+                "Reshape",
+                "Less"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Constant",
+                "Where",
+                "Tile",
+                "ConstantOfShape",
+                "Expand",
+                "MatMul",
+                "Unsqueeze",
+                "Range",
+                "Transpose",
+                "Tanh",
+                "ReduceMean",
+                "Cast",
+                "Sqrt",
+                "Slice",
+                "Add",
+                "Neg",
+                "Min",
+                "Log",
+                "Concat",
+                "Div",
+                "Softmax",
+                "Pow",
+                "If",
+                "Shape",
+                "Gather",
+                "Sub",
+                "LessOrEqual",
+                "Mul",
+                "Reshape",
+                "Less"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Constant",
+                "Where",
+                "Tile",
+                "ConstantOfShape",
+                "Expand",
+                "MatMul",
+                "Unsqueeze",
+                "Range",
+                "Transpose",
+                "Tanh",
+                "ReduceMean",
+                "Cast",
+                "Sqrt",
+                "Slice",
+                "Add",
+                "Neg",
+                "Min",
+                "Log",
+                "Concat",
+                "Div",
+                "Softmax",
+                "Pow",
+                "Shape",
+                "Gather",
+                "Sub",
+                "LessOrEqual",
+                "Mul",
+                "Reshape",
+                "Less"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}

tokenizer_config.json CHANGED Viewed

@@ -104,6 +104,7 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
   "model_max_length": 512,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},

   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
+  "legacy": true,
   "model_max_length": 512,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},