clejordan committed on
Commit
e27eaf8
·
verified ·
1 Parent(s): 329b443

Upload Qwen3ForCausalLM

Browse files
Files changed (2) hide show
  1. config.json +16 -5
  2. model.safetensors +2 -2
config.json CHANGED
@@ -20,7 +20,18 @@
20
  "quantization_config": {
21
  "config_groups": {
22
  "group_0": {
23
- "input_activations": null,
 
 
 
 
 
 
 
 
 
 
 
24
  "output_activations": null,
25
  "targets": [
26
  "Linear"
@@ -29,17 +40,17 @@
29
  "actorder": null,
30
  "block_structure": null,
31
  "dynamic": false,
32
- "group_size": 128,
33
- "num_bits": 4,
34
  "observer": "minmax",
35
  "observer_kwargs": {},
36
- "strategy": "group",
37
  "symmetric": true,
38
  "type": "int"
39
  }
40
  }
41
  },
42
- "format": "pack-quantized",
43
  "global_compression_ratio": null,
44
  "ignore": [
45
  "lm_head"
 
20
  "quantization_config": {
21
  "config_groups": {
22
  "group_0": {
23
+ "input_activations": {
24
+ "actorder": null,
25
+ "block_structure": null,
26
+ "dynamic": true,
27
+ "group_size": null,
28
+ "num_bits": 8,
29
+ "observer": null,
30
+ "observer_kwargs": {},
31
+ "strategy": "token",
32
+ "symmetric": true,
33
+ "type": "int"
34
+ },
35
  "output_activations": null,
36
  "targets": [
37
  "Linear"
 
40
  "actorder": null,
41
  "block_structure": null,
42
  "dynamic": false,
43
+ "group_size": null,
44
+ "num_bits": 8,
45
  "observer": "minmax",
46
  "observer_kwargs": {},
47
+ "strategy": "channel",
48
  "symmetric": true,
49
  "type": "int"
50
  }
51
  }
52
  },
53
+ "format": "int-quantized",
54
  "global_compression_ratio": null,
55
  "ignore": [
56
  "lm_head"
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28f4e35de4c9cfcbd67a6d655fdd2d9dc4b7da11bb6ad1647f580f0b1c2a7640
3
- size 856637120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7acaff9792cb5d9456a90130d4ecaa2e2c5f55d994fae6811daa5b256c6edafb
3
+ size 1064427600