dtransposed committed on
Commit
ee305cf
1 Parent(s): 4f0757b

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +14 -21
config.json CHANGED
@@ -9,26 +9,22 @@
9
  "compression_config": {
10
  "config_groups": {
11
  "group_0": {
12
- "input_activations": null,
13
- "output_activations": null,
14
- "targets": [
15
- "Linear"
16
- ],
17
- "weights": {
18
  "block_structure": null,
19
  "dynamic": false,
20
  "group_size": null,
21
- "num_bits": 4,
22
  "observer": "minmax",
23
  "observer_kwargs": {},
24
- "strategy": "channel",
25
  "symmetric": true,
26
  "type": "int"
27
- }
28
- },
29
- "kv_cache": {
30
- "input_activations": null,
31
- "output_activations": {
 
32
  "block_structure": null,
33
  "dynamic": false,
34
  "group_size": null,
@@ -37,18 +33,15 @@
37
  "observer_kwargs": {},
38
  "strategy": "tensor",
39
  "symmetric": true,
40
- "type": "float"
41
- },
42
- "targets": [
43
- "re:.*k_proj",
44
- "re:.*v_proj"
45
- ],
46
- "weights": null
47
  }
48
  },
49
  "format": "pack-quantized",
50
  "global_compression_ratio": null,
51
- "ignore": [],
 
 
52
  "kv_cache_scheme": {
53
  "block_structure": null,
54
  "dynamic": false,
 
9
  "compression_config": {
10
  "config_groups": {
11
  "group_0": {
12
+ "input_activations": {
 
 
 
 
 
13
  "block_structure": null,
14
  "dynamic": false,
15
  "group_size": null,
16
+ "num_bits": 8,
17
  "observer": "minmax",
18
  "observer_kwargs": {},
19
+ "strategy": "tensor",
20
  "symmetric": true,
21
  "type": "int"
22
+ },
23
+ "output_activations": null,
24
+ "targets": [
25
+ "Linear"
26
+ ],
27
+ "weights": {
28
  "block_structure": null,
29
  "dynamic": false,
30
  "group_size": null,
 
33
  "observer_kwargs": {},
34
  "strategy": "tensor",
35
  "symmetric": true,
36
+ "type": "int"
37
+ }
 
 
 
 
 
38
  }
39
  },
40
  "format": "pack-quantized",
41
  "global_compression_ratio": null,
42
+ "ignore": [
43
+ "lm_head"
44
+ ],
45
  "kv_cache_scheme": {
46
  "block_structure": null,
47
  "dynamic": false,