Update RT-Qwen3-4B-AWQ with latest interleave_focal checkpoint

Files changed (3)

RT-Qwen3-4B-AWQ/config.json CHANGED

@@ -75,9 +75,9 @@
           "observer_kwargs": {},
           "scale_dtype": null,
           "strategy": "group",
-          "symmetric": true,
           "type": "int",
-          "zp_dtype": null
         }
       }
     },

           "observer_kwargs": {},
           "scale_dtype": null,
           "strategy": "group",
+          "symmetric": false,
           "type": "int",
+          "zp_dtype": "torch.int8"
         }
       }
     },

RT-Qwen3-4B-AWQ/model.safetensors CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e00cef750d0332c56eea1ad8c98fb1f88c83cc8db4dcfc7325894113f121f134
-size 3427191984

 version https://git-lfs.github.com/spec/v1
+oid sha256:3b04e9724acc9898f19eaf88b9c934689e7eacf4c9df569af62815911e4a6532
+size 3441415440

RT-Qwen3-4B-AWQ/recipe.yaml CHANGED

@@ -3,7 +3,7 @@ default_stage:
     AWQModifier:
       targets: [Linear]
       ignore: [lm_head]
-      scheme: W4A16
       mappings:
       - smooth_layer: re:.*input_layernorm
         balance_layers: ['re:.*q_proj', 're:.*k_proj', 're:.*v_proj']

     AWQModifier:
       targets: [Linear]
       ignore: [lm_head]
+      scheme: W4A16_ASYM
       mappings:
       - smooth_layer: re:.*input_layernorm
         balance_layers: ['re:.*q_proj', 're:.*k_proj', 're:.*v_proj']