atrost
/

test_steerable_hf_model_v3

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:67d6bb370e3a52fedc360ffceab7c797adf494f3672773e8c7acd54f7c10d712
 size 3555597480

 version https://git-lfs.github.com/spec/v1
+oid sha256:31141725b3f01ee2f06dc199d77890c5e24603c760dc70a2823bfe27f3ad6866
 size 3555597480

qwen2_postblock_steering_fixed.py CHANGED Viewed

@@ -59,11 +59,11 @@ class Qwen2DecoderLayerPostBlockSteering(Qwen2DecoderLayer):
         self,
         config,
         layer_idx: int,
-        enable: bool,
-        rank: int,
-        alpha: float,
-        activation: str,
-        apply_to: str,
     ):
         super().__init__(config, layer_idx)
         assert apply_to in ("last", "all")

         self,
         config,
         layer_idx: int,
+        enable: bool = True,
+        rank: int = 8,
+        alpha: float = 1.0,
+        activation: str = "silu",
+        apply_to: str = "all",
     ):
         super().__init__(config, layer_idx)
         assert apply_to in ("last", "all")