Upload optimized ONNX files w/ GQA
Browse files
onnx/decoder_model_merged_fp16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59bff9c12eba82bcc6c6893eacd61118e7d69ec9a1e9595eb66a19db72665dde
|
3 |
+
size 546702610
|
onnx/decoder_model_merged_fp16.onnx_data
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:707a678ab9e378fb739d8574b2668b73e8b7354fb2bc275a34e97b81215c098c
|
3 |
+
size 2080374784
|
onnx/decoder_model_merged_q4.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00e5f3de4b5329d46d90190909a5b53eac6883a616c5f973f433d60756272f3c
|
3 |
+
size 739917026
|
onnx/decoder_model_merged_q4f16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35462bc13ce0af9df13a0233fb3e214cf6587ea6a1c51ab0c8fd616619f7ee1e
|
3 |
+
size 739917090
|