keko24 committed on
Commit
a0c1986
·
verified ·
1 Parent(s): a550fe0

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +43 -1
config.json CHANGED
@@ -17,6 +17,48 @@
17
  "num_attention_heads": 16,
18
  "num_hidden_layers": 28,
19
  "num_key_value_heads": 8,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20
  "rms_norm_eps": 1e-06,
21
  "rope_scaling": null,
22
  "rope_theta": 1000000,
@@ -27,4 +69,4 @@
27
  "use_cache": true,
28
  "use_sliding_window": false,
29
  "vocab_size": 151936
30
- }
 
17
  "num_attention_heads": 16,
18
  "num_hidden_layers": 28,
19
  "num_key_value_heads": 8,
20
+ "quantization_config": {
21
+ "config_groups": {
22
+ "group_1": {
23
+ "input_activations": {
24
+ "actorder": null,
25
+ "block_structure": null,
26
+ "dynamic": true,
27
+ "group_size": null,
28
+ "num_bits": 8,
29
+ "observer": null,
30
+ "observer_kwargs": {},
31
+ "strategy": "token",
32
+ "symmetric": true,
33
+ "type": "int"
34
+ },
35
+ "output_activations": null,
36
+ "targets": [
37
+ "Linear"
38
+ ],
39
+ "weights": {
40
+ "actorder": null,
41
+ "block_structure": null,
42
+ "dynamic": false,
43
+ "group_size": 128,
44
+ "num_bits": 4,
45
+ "observer": "minmax",
46
+ "observer_kwargs": {},
47
+ "strategy": "group",
48
+ "symmetric": true,
49
+ "type": "int"
50
+ }
51
+ }
52
+ },
53
+ "format": "pack-quantized",
54
+ "global_compression_ratio": null,
55
+ "ignore": [
56
+ "lm_head"
57
+ ],
58
+ "kv_cache_scheme": null,
59
+ "quant_method": "compressed-tensors",
60
+ "quantization_status": "compressed"
61
+ },
62
  "rms_norm_eps": 1e-06,
63
  "rope_scaling": null,
64
  "rope_theta": 1000000,
 
69
  "use_cache": true,
70
  "use_sliding_window": false,
71
  "vocab_size": 151936
72
+ }