Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +1 -1
generation_config.json +2 -2
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +74 -74
tokenizer.json +0 -0

config.json CHANGED Viewed

@@ -54,7 +54,7 @@
   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "vocab_size": 57642
 }

   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 57642
 }

generation_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "_from_model_config": true,
   "bad_words_ids": [
     [
       57641
@@ -12,5 +11,6 @@
   "max_length": 512,
   "num_beams": 6,
   "pad_token_id": 57641,
-  "transformers_version": "4.32.0.dev0"
 }

 {
   "bad_words_ids": [
     [
       57641
   "max_length": 512,
   "num_beams": 6,
   "pad_token_id": 57641,
+  "renormalize_logits": true,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e1693efe660470bd8adbfe3296b37b0bc1d9be33d8d6e369528c1e5f8308a23a
-size 338553760

 version https://git-lfs.github.com/spec/v1
+oid sha256:07342521a547809bb38ab91a0939cc763c8373330f7670e9d86d8e7fc0065cb7
+size 220503001

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ac5a1d5e1401574c835a1c0acdac5074f57b72cb25160c0c84a5caac97d6ef3
-size 338789242

 version https://git-lfs.github.com/spec/v1
+oid sha256:fad840794c922b7a83fe958fc2c88255c09bcf12cb1cb4099a31711017e34091
+size 220738568

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d9c4fba6ac26690f6325dde5643a68b9d96bc214b44dbe85f5f9cd4c5903ed8d
-size 86217886

 version https://git-lfs.github.com/spec/v1
+oid sha256:7915cb6d03674552b6f7a3bcd4fe04e4dedd2a16fc120b4bcab39a03c6e6ecb4
+size 56415560

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3139e0482d113a31a14514cf48b734121ab07fa252bfd42e97a8f784bbe75aa7
-size 85846530

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c5b9b864ee0628850d7f50ed24f8da3b0fddef285ffe23724d21fb0ac564c02
+size 56044858

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1684ed2ead95e4346e0d082dd77ef54eccd589c37125eae1ac4432b71bd8976e
-size 325903251

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ceccaef9e3fa65b633f1a5283c1d4b81761cd2bd18b86f2bede63a0dd1a48ca
+size 207852492

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:645dd32b8c1dd06dd1c5149405a2b3963bb72d99915723d5d030f074b67baf23
-size 82575066

 version https://git-lfs.github.com/spec/v1
+oid sha256:619507f34314419c196b4edd6fed2503730282bfd5df8bbba7ff7f743bb80e09
+size 52773394

quantize_config.json CHANGED Viewed

@@ -4,120 +4,120 @@
     "per_model_config": {
         "encoder_model": {
             "op_types": [
-                "Sqrt",
                 "Unsqueeze",
-                "Range",
                 "Equal",
                 "Sub",
                 "ConstantOfShape",
                 "Pow",
                 "Constant",
-                "Sigmoid",
-                "Reshape",
-                "MatMul",
-                "Div",
-                "Shape",
-                "ReduceMean",
-                "Cast",
-                "Gather",
-                "Where",
-                "Add",
-                "Expand",
-                "Transpose",
-                "Concat",
-                "Softmax",
-                "Mul"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Sqrt",
                 "Unsqueeze",
                 "Equal",
                 "Sub",
                 "Range",
                 "ConstantOfShape",
                 "Pow",
                 "Constant",
-                "Sigmoid",
-                "Reshape",
-                "MatMul",
-                "Div",
-                "Shape",
-                "ReduceMean",
-                "Cast",
-                "Gather",
-                "Where",
-                "Add",
-                "Expand",
-                "Transpose",
-                "Concat",
-                "Softmax",
-                "Mul"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
                 "Slice",
-                "Sqrt",
                 "Unsqueeze",
-                "Range",
                 "Equal",
                 "Sub",
                 "ConstantOfShape",
                 "Pow",
                 "Constant",
-                "Sigmoid",
-                "Reshape",
-                "Less",
-                "MatMul",
-                "Div",
-                "Shape",
-                "ReduceMean",
-                "Cast",
-                "Gather",
-                "Where",
-                "Add",
-                "Expand",
-                "Transpose",
-                "Concat",
-                "Softmax",
-                "Mul",
-                "Squeeze"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
                 "Slice",
-                "Sqrt",
                 "Unsqueeze",
-                "Range",
                 "Equal",
                 "Sub",
                 "ConstantOfShape",
                 "Pow",
                 "Constant",
-                "Sigmoid",
-                "Reshape",
-                "Less",
-                "MatMul",
-                "Div",
-                "Shape",
-                "ReduceMean",
-                "Cast",
-                "Gather",
-                "If",
-                "Where",
-                "Add",
-                "Expand",
-                "Transpose",
-                "Concat",
-                "Softmax",
-                "Mul",
-                "Squeeze"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "encoder_model": {
             "op_types": [
+                "Add",
+                "Mul",
+                "ReduceMean",
                 "Unsqueeze",
+                "MatMul",
+                "Transpose",
                 "Equal",
+                "Expand",
+                "Sqrt",
+                "Div",
                 "Sub",
+                "Where",
+                "Gather",
+                "Concat",
+                "Cast",
+                "Range",
+                "Sigmoid",
                 "ConstantOfShape",
+                "Shape",
+                "Reshape",
                 "Pow",
                 "Constant",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Add",
+                "Mul",
+                "ReduceMean",
                 "Unsqueeze",
+                "MatMul",
+                "Transpose",
                 "Equal",
+                "Expand",
+                "Sqrt",
+                "Div",
                 "Sub",
+                "Where",
+                "Gather",
+                "Concat",
+                "Cast",
                 "Range",
+                "Sigmoid",
                 "ConstantOfShape",
+                "Shape",
+                "Reshape",
                 "Pow",
                 "Constant",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Add",
+                "Mul",
+                "Squeeze",
                 "Slice",
+                "ReduceMean",
                 "Unsqueeze",
+                "MatMul",
+                "Less",
+                "If",
                 "Equal",
+                "Transpose",
+                "Expand",
+                "Sqrt",
+                "Div",
                 "Sub",
+                "Where",
+                "Gather",
+                "Concat",
+                "Cast",
+                "Range",
+                "Sigmoid",
                 "ConstantOfShape",
+                "Shape",
+                "Reshape",
                 "Pow",
                 "Constant",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model": {
             "op_types": [
+                "Add",
+                "Mul",
+                "Squeeze",
                 "Slice",
+                "ReduceMean",
                 "Unsqueeze",
+                "MatMul",
+                "Less",
+                "Transpose",
                 "Equal",
+                "Expand",
+                "Sqrt",
+                "Div",
                 "Sub",
+                "Where",
+                "Gather",
+                "Concat",
+                "Cast",
+                "Range",
+                "Sigmoid",
                 "ConstantOfShape",
+                "Shape",
+                "Reshape",
                 "Pow",
                 "Constant",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff