TheBloke committed on
Commit
3b12e26
1 Parent(s): 66e15a7

Update for Transformers AWQ support

Browse files
Files changed (1) hide show
  1. config.json +9 -2
config.json CHANGED
@@ -25,5 +25,12 @@
25
  "torch_dtype": "float16",
26
  "transformers_version": "4.34.0",
27
  "use_cache": true,
28
- "vocab_size": 32000
29
- }
 
 
 
 
 
 
 
 
25
  "torch_dtype": "float16",
26
  "transformers_version": "4.34.0",
27
  "use_cache": true,
28
+ "vocab_size": 32000,
29
+ "quantization_config": {
30
+ "quant_method": "awq",
31
+ "zero_point": true,
32
+ "group_size": 128,
33
+ "bits": 4,
34
+ "version": "gemm"
35
+ }
36
+ }