Upload folder using huggingface_hub

Browse files

Files changed (8) hide show

config.json +3 -2
generation_config.json +1 -1
onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +73 -73
tokenizer_config.json +2 -1

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "Xenova/llama2.c",
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -17,8 +17,9 @@
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": null,
   "tie_word_embeddings": false,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "vocab_size": 32000
 }

 {
+  "_name_or_path": "Xenova/llama2.c-stories15M",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": null,
+  "rope_theta": 10000.0,
   "tie_word_embeddings": false,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 32000
 }

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
-  "transformers_version": "4.32.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee3d45805b922adb525ec778db4b2692db680561df445eebc94fce85d88985e2
 size 98260154

 version https://git-lfs.github.com/spec/v1
+oid sha256:6816b265a96d80bb85a622c394dc819b269680f327b82ea64f3c77f32117d84e
 size 98260154

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3ab44c99230849a428c3e3f7fb2e91b05f5b4642c19a1ec5d3877f8302cd1689
-size 25528662

 version https://git-lfs.github.com/spec/v1
+oid sha256:473abf17f5284a881ea1086cfead870211b933365a91cead05e2274f94b7d5cb
+size 25279161

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8a16c83ee7a1904271ba34b81d4f8e978cfd8cef34d99245e2453aff29d90c22
-size 25098988

 version https://git-lfs.github.com/spec/v1
+oid sha256:83c62704973668509b573854d3c24d3d47322db722538f0ce6064bc9f425802e
+size 24849487

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:652587ee72f73418d7816f093df492ad8005ddcf3fc970885f7658ade6a2bca8
-size 25098621

 version https://git-lfs.github.com/spec/v1
+oid sha256:dafb7a1a57c760eac3203352c6db49456532166dca7ff046bdb5b7127d3eadec
+size 24849120

quantize_config.json CHANGED Viewed

@@ -1,105 +1,105 @@
 {
-    "per_channel": true,
-    "reduce_range": true,
     "per_model_config": {
-        "decoder_model_merged": {
             "op_types": [
-                "Unsqueeze",
                 "Sigmoid",
-                "Concat",
-                "Expand",
                 "Transpose",
-                "Shape",
-                "Range",
-                "Constant",
                 "Neg",
-                "If",
-                "Cast",
                 "Softmax",
-                "Gather",
-                "Add",
-                "Equal",
-                "Reshape",
-                "MatMul",
-                "ConstantOfShape",
                 "Div",
-                "Slice",
-                "Sub",
-                "Mul",
-                "Where",
                 "Less",
-                "Pow",
-                "ReduceMean",
-                "Sqrt",
-                "Squeeze",
-                "Identity"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_with_past_model": {
             "op_types": [
-                "Unsqueeze",
                 "Sigmoid",
-                "Concat",
-                "Expand",
                 "Transpose",
-                "Shape",
-                "Range",
-                "Constant",
                 "Neg",
-                "If",
-                "Cast",
                 "Softmax",
                 "Gather",
-                "Add",
-                "Equal",
-                "Reshape",
                 "MatMul",
-                "ConstantOfShape",
-                "Div",
-                "Slice",
-                "Sub",
-                "Mul",
-                "Where",
-                "Pow",
-                "ReduceMean",
-                "Sqrt",
-                "Squeeze",
-                "Identity"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Unsqueeze",
                 "Sigmoid",
-                "Concat",
-                "Expand",
                 "Transpose",
-                "Shape",
-                "Range",
-                "Constant",
                 "Neg",
-                "If",
-                "Cast",
                 "Softmax",
                 "Gather",
-                "Add",
-                "Equal",
-                "Reshape",
                 "MatMul",
-                "ConstantOfShape",
-                "Div",
-                "Slice",
-                "Sub",
-                "Mul",
-                "Where",
-                "Less",
-                "Pow",
-                "ReduceMean",
-                "Sqrt",
-                "Squeeze",
-                "Identity"
             ],
             "weight_type": "QInt8"
         }

 {
+    "per_channel": false,
+    "reduce_range": false,
     "per_model_config": {
+        "decoder_model": {
             "op_types": [
+                "Squeeze",
+                "Identity",
+                "Constant",
+                "Add",
+                "Pow",
+                "ConstantOfShape",
+                "If",
+                "Reshape",
+                "Sqrt",
+                "Equal",
+                "Where",
                 "Sigmoid",
+                "Sub",
+                "ReduceMean",
                 "Transpose",
+                "Slice",
                 "Neg",
                 "Softmax",
+                "Range",
+                "Shape",
                 "Div",
+                "Gather",
+                "Concat",
+                "Expand",
+                "Cast",
                 "Less",
+                "Unsqueeze",
+                "MatMul",
+                "Mul"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Squeeze",
+                "Identity",
+                "Constant",
+                "Add",
+                "Pow",
+                "ConstantOfShape",
+                "If",
+                "Reshape",
+                "Sqrt",
+                "Equal",
+                "Where",
                 "Sigmoid",
+                "Sub",
+                "ReduceMean",
                 "Transpose",
+                "Slice",
                 "Neg",
                 "Softmax",
+                "Range",
+                "Shape",
+                "Div",
                 "Gather",
+                "Concat",
+                "Expand",
+                "Cast",
+                "Less",
+                "Unsqueeze",
                 "MatMul",
+                "Mul"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_with_past_model": {
             "op_types": [
+                "Squeeze",
+                "Identity",
+                "Constant",
+                "Add",
+                "Pow",
+                "ConstantOfShape",
+                "If",
+                "Reshape",
+                "Sqrt",
+                "Where",
+                "Equal",
                 "Sigmoid",
+                "Sub",
+                "ReduceMean",
                 "Transpose",
+                "Slice",
                 "Neg",
                 "Softmax",
+                "Range",
+                "Shape",
+                "Div",
                 "Gather",
+                "Concat",
+                "Expand",
+                "Cast",
+                "Unsqueeze",
                 "MatMul",
+                "Mul"
             ],
             "weight_type": "QInt8"
         }

tokenizer_config.json CHANGED Viewed

@@ -27,5 +27,6 @@
     "normalized": true,
     "rstrip": false,
     "single_word": false
-  }
 }

     "normalized": true,
     "rstrip": false,
     "single_word": false
+  },
+  "use_default_system_prompt": true
 }