Upload quantized ONNX weights
Browse files- onnx/decoder_model_bnb4.onnx +3 -0
- onnx/decoder_model_fp16.onnx +3 -0
- onnx/decoder_model_int8.onnx +3 -0
- onnx/decoder_model_merged_bnb4.onnx +3 -0
- onnx/decoder_model_merged_fp16.onnx +3 -0
- onnx/decoder_model_merged_int8.onnx +3 -0
- onnx/decoder_model_merged_q4.onnx +3 -0
- onnx/decoder_model_merged_quantized.onnx +3 -0
- onnx/decoder_model_merged_uint8.onnx +3 -0
- onnx/decoder_model_q4.onnx +3 -0
- onnx/decoder_model_quantized.onnx +3 -0
- onnx/decoder_model_uint8.onnx +3 -0
- onnx/decoder_with_past_model_bnb4.onnx +3 -0
- onnx/decoder_with_past_model_fp16.onnx +3 -0
- onnx/decoder_with_past_model_int8.onnx +3 -0
- onnx/decoder_with_past_model_q4.onnx +3 -0
- onnx/decoder_with_past_model_quantized.onnx +3 -0
- onnx/decoder_with_past_model_uint8.onnx +3 -0
- onnx/embed_tokens_bnb4.onnx +3 -0
- onnx/embed_tokens_fp16.onnx +3 -0
- onnx/embed_tokens_int8.onnx +3 -0
- onnx/embed_tokens_q4.onnx +3 -0
- onnx/embed_tokens_quantized.onnx +3 -0
- onnx/embed_tokens_uint8.onnx +3 -0
- onnx/encoder_model_bnb4.onnx +3 -0
- onnx/encoder_model_fp16.onnx +3 -0
- onnx/encoder_model_int8.onnx +3 -0
- onnx/encoder_model_q4.onnx +3 -0
- onnx/encoder_model_quantized.onnx +3 -0
- onnx/encoder_model_uint8.onnx +3 -0
- onnx/vision_encoder_bnb4.onnx +3 -0
- onnx/vision_encoder_fp16.onnx +3 -0
- onnx/vision_encoder_int8.onnx +3 -0
- onnx/vision_encoder_q4.onnx +3 -0
- onnx/vision_encoder_quantized.onnx +3 -0
- onnx/vision_encoder_uint8.onnx +3 -0
onnx/decoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff0b9cfbee73984dfc10833ef5be99a6485f15ecac770f119997b98c75da39ed
|
3 |
+
size 148757128
|
onnx/decoder_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:059a04344350e80eec87b7a360f77d6d9de27817ebd7ed109f004469b043151f
|
3 |
+
size 510975587
|
onnx/decoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f0f6cd83c057df5da5a0586d3c5483d9135d17537ec876bb8e8ebbf42627f7e
|
3 |
+
size 256816021
|
onnx/decoder_model_merged_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96e701c77fc34737334ed853c07365b2329fe7a2b6a80388b51158e7471e38f0
|
3 |
+
size 149432159
|
onnx/decoder_model_merged_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f007b050621cd1b60392f25a4fe837fb2eda425c11580edd376acc77a369b9b
|
3 |
+
size 511643557
|
onnx/decoder_model_merged_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a87417445e9ecbf0adb68ac0c2c86a7a05f7415b41a45404152528c2dc5d494
|
3 |
+
size 257619797
|
onnx/decoder_model_merged_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d13b29ac7da5a998c73d9d8bf9e9380425dc5d03398a82507831651e1a47a374
|
3 |
+
size 165295714
|
onnx/decoder_model_merged_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a87417445e9ecbf0adb68ac0c2c86a7a05f7415b41a45404152528c2dc5d494
|
3 |
+
size 257619797
|
onnx/decoder_model_merged_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68d47062b82f1ae06eeab32445b25b77c07fc4ee97ae636b7fba6185044df6ea
|
3 |
+
size 257619768
|
onnx/decoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83cb8cead83f91d5c5e4c1ac6a3e20073f96cc9512a6a032c70c2eb704dc21e0
|
3 |
+
size 164621556
|
onnx/decoder_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f0f6cd83c057df5da5a0586d3c5483d9135d17537ec876bb8e8ebbf42627f7e
|
3 |
+
size 256816021
|
onnx/decoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70eed266a19fd4e2d981209232da882431bc2b378cea0921d8db1ac821a53d55
|
3 |
+
size 256816082
|
onnx/decoder_with_past_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c8c17a4be4f6ebb98907194424c77733427441c120065fd4e0ca564a2126be0
|
3 |
+
size 134368512
|
onnx/decoder_with_past_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7675346298bd4d5a2c3951346e4aa896c2f5f84d28d07fab261291f20d444505
|
3 |
+
size 460467968
|
onnx/decoder_with_past_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:269740e47586ab594ba6e5f36b3582e18394fde8b04846bd2e6a3bc4be21d2dd
|
3 |
+
size 231394266
|
onnx/decoder_with_past_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a39fca9b7151371ba1f8f78f6e531abfd1cbf9521d5f9597027185ade16ea57
|
3 |
+
size 148660268
|
onnx/decoder_with_past_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:269740e47586ab594ba6e5f36b3582e18394fde8b04846bd2e6a3bc4be21d2dd
|
3 |
+
size 231394266
|
onnx/decoder_with_past_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:537ce27eb955ec77e1ca54476a75c3fd82c602dcc52d554aeffc78a6e03b3e24
|
3 |
+
size 231394313
|
onnx/embed_tokens_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e2d2d452503b2c75683f21e96659a13b3c3da1561ca59a5294ee35f9f49b78c
|
3 |
+
size 210080062
|
onnx/embed_tokens_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:661859f77f1b3f9d2bcdd8eb4fc6e611f48c51abdc55af67de1aa2e0e466ccda
|
3 |
+
size 105040321
|
onnx/embed_tokens_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f64649977559f0f88c5beed562d1f4c1f946f4831d17afe433f2d76a7da2fb6
|
3 |
+
size 52520480
|
onnx/embed_tokens_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e2d2d452503b2c75683f21e96659a13b3c3da1561ca59a5294ee35f9f49b78c
|
3 |
+
size 210080062
|
onnx/embed_tokens_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f64649977559f0f88c5beed562d1f4c1f946f4831d17afe433f2d76a7da2fb6
|
3 |
+
size 52520480
|
onnx/embed_tokens_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70516a87d14ce774a15ca5ec0d8c2bc58c44552959e372196b741bfaa1c3eb70
|
3 |
+
size 52520479
|
onnx/encoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7a71f51c0be8ff2de5bdb19e1c76344d2657c9cc3e0fd29c7280feb7ace1df8
|
3 |
+
size 90015331
|
onnx/encoder_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53211b7c6fd8dc63422d7423fe637fc7debea665996c08a31352943c2e96b231
|
3 |
+
size 304634480
|
onnx/encoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10f49539850b62d21b80f1d0950359aa6b5e6801378fa8aa968a5eaf2f449448
|
3 |
+
size 152985855
|
onnx/encoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa3fdccdbab224adcfbf3c5df7a95ea89cdffc7e917bac9f8a7879b94560c1f0
|
3 |
+
size 99451927
|
onnx/encoder_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10f49539850b62d21b80f1d0950359aa6b5e6801378fa8aa968a5eaf2f449448
|
3 |
+
size 152985855
|
onnx/encoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6eb30cf8a1ff4af6e79b9858494331a122ac919f7b430bbe41c7f6e22d75d8a2
|
3 |
+
size 152985897
|
onnx/vision_encoder_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3e8e06be761ac08da0fb35f8cf3f2ebea3e9f2cb4a8cc08caefd2119e02fbc8
|
3 |
+
size 294675311
|
onnx/vision_encoder_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e5a26503ed487facd4459cfac85513b6c917dabd021c5ed141f283a0c7e8514
|
3 |
+
size 727422819
|
onnx/vision_encoder_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba1f4c8ca1fcfb0007defae0827a2528f388af79b9f000881d573796af40bb80
|
3 |
+
size 366371735
|
onnx/vision_encoder_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd2949cc69b4ffaaa135e813a0ede5f864a3084322565fafec95eaf17bd304e9
|
3 |
+
size 315744349
|
onnx/vision_encoder_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74aa56d21ce306d559bb8ddef99cf04915c14fd9aa0452f9e39914d5a859fb4e
|
3 |
+
size 366371812
|
onnx/vision_encoder_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74aa56d21ce306d559bb8ddef99cf04915c14fd9aa0452f9e39914d5a859fb4e
|
3 |
+
size 366371812
|