TheBloke committed on
Commit
db7403c
1 Parent(s): 83c5701

Update for Transformers AWQ support

Browse files
Files changed (1) hide show
  1. config.json +9 -2
config.json CHANGED
@@ -30,5 +30,12 @@
30
  "torch_dtype": "float16",
31
  "transformers_version": "4.34.1",
32
  "use_cache": true,
33
- "vocab_size": 100008
34
- }
 
 
 
 
 
 
 
 
30
  "torch_dtype": "float16",
31
  "transformers_version": "4.34.1",
32
  "use_cache": true,
33
+ "vocab_size": 100008,
34
+ "quantization_config": {
35
+ "quant_method": "awq",
36
+ "zero_point": true,
37
+ "group_size": 128,
38
+ "bits": 4,
39
+ "version": "gemm"
40
+ }
41
+ }