Upload folder using huggingface_hub
Browse files
- config.json +20 -0
- model.safetensors +2 -2
- recipe.yaml +1 -1
config.json
CHANGED
|
@@ -76,6 +76,26 @@
|
|
| 76 |
"format": "pack-quantized",
|
| 77 |
"global_compression_ratio": null,
|
| 78 |
"ignore": [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 79 |
"lm_head"
|
| 80 |
],
|
| 81 |
"kv_cache_scheme": null,
|
|
|
|
| 76 |
"format": "pack-quantized",
|
| 77 |
"global_compression_ratio": null,
|
| 78 |
"ignore": [
|
| 79 |
+
"model.layers.0.conv.in_proj",
|
| 80 |
+
"model.layers.0.conv.out_proj",
|
| 81 |
+
"model.layers.1.conv.in_proj",
|
| 82 |
+
"model.layers.1.conv.out_proj",
|
| 83 |
+
"model.layers.3.conv.in_proj",
|
| 84 |
+
"model.layers.3.conv.out_proj",
|
| 85 |
+
"model.layers.4.conv.in_proj",
|
| 86 |
+
"model.layers.4.conv.out_proj",
|
| 87 |
+
"model.layers.6.conv.in_proj",
|
| 88 |
+
"model.layers.6.conv.out_proj",
|
| 89 |
+
"model.layers.7.conv.in_proj",
|
| 90 |
+
"model.layers.7.conv.out_proj",
|
| 91 |
+
"model.layers.9.conv.in_proj",
|
| 92 |
+
"model.layers.9.conv.out_proj",
|
| 93 |
+
"model.layers.11.conv.in_proj",
|
| 94 |
+
"model.layers.11.conv.out_proj",
|
| 95 |
+
"model.layers.13.conv.in_proj",
|
| 96 |
+
"model.layers.13.conv.out_proj",
|
| 97 |
+
"model.layers.15.conv.in_proj",
|
| 98 |
+
"model.layers.15.conv.out_proj",
|
| 99 |
"lm_head"
|
| 100 |
],
|
| 101 |
"kv_cache_scheme": null,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18f84bbf9b45b9a9a03378d301e588bab8ccad63ab216b5e2382042a2cc4e833
|
| 3 |
+
size 1320385384
|
recipe.yaml
CHANGED
|
@@ -2,7 +2,7 @@ default_stage:
|
|
| 2 |
default_modifiers:
|
| 3 |
AWQModifier:
|
| 4 |
targets: [Linear]
|
| 5 |
-
ignore: [lm_head]
|
| 6 |
scheme: W4A16
|
| 7 |
mappings:
|
| 8 |
- smooth_layer: re:.*layers\.(2|5|8|10|12|14)\.operator_norm$
|
|
|
|
| 2 |
default_modifiers:
|
| 3 |
AWQModifier:
|
| 4 |
targets: [Linear]
|
| 5 |
+
ignore: [lm_head, 're:.*conv\.in_proj.*', 're:.*conv\.out_proj.*']
|
| 6 |
scheme: W4A16
|
| 7 |
mappings:
|
| 8 |
- smooth_layer: re:.*layers\.(2|5|8|10|12|14)\.operator_norm$
|