casperhansen
committed on
Commit
•
a182ae0
1
Parent(s):
f8ce961
Update config.json
Browse files
- config.json +7 -0
config.json
CHANGED
@@ -26,6 +26,13 @@
   "n_head": 71,
   "n_layer": 32,
   "parallel_attn": true,
+  "quantization_config": {
+    "bits": 4,
+    "group_size": 64,
+    "quant_method": "awq",
+    "version": "gemm",
+    "zero_point": true
+  },
   "torch_dtype": "float16",
   "transformers_version": "4.31.0",
   "use_cache": true,