subhadip-rotalabs committed on Jan 27

Commit

57f5aee

verified ·

1 Parent(s): 429b851

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

hierarchy_mistral_7b_instruct_v0.2/layer_10.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_10.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_11.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_11.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_12.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_12.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_13.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_13.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_14.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_14.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_15.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_15.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_16.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_16.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_17.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_17.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_18.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_18.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_19.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_19.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/layer_20.json +17 -0
hierarchy_mistral_7b_instruct_v0.2/layer_20.pt +3 -0
hierarchy_mistral_7b_instruct_v0.2/metadata.json +89 -0
hierarchy_qwen3_8b/layer_12.json +17 -0
hierarchy_qwen3_8b/layer_12.pt +3 -0
hierarchy_qwen3_8b/layer_13.json +17 -0
hierarchy_qwen3_8b/layer_13.pt +3 -0
hierarchy_qwen3_8b/layer_14.json +17 -0
hierarchy_qwen3_8b/layer_14.pt +3 -0
hierarchy_qwen3_8b/layer_15.json +17 -0
hierarchy_qwen3_8b/layer_15.pt +3 -0
hierarchy_qwen3_8b/layer_16.json +17 -0
hierarchy_qwen3_8b/layer_16.pt +3 -0
hierarchy_qwen3_8b/layer_17.json +17 -0
hierarchy_qwen3_8b/layer_17.pt +3 -0
hierarchy_qwen3_8b/layer_18.json +17 -0
hierarchy_qwen3_8b/layer_18.pt +3 -0
hierarchy_qwen3_8b/layer_19.json +17 -0
hierarchy_qwen3_8b/layer_19.pt +3 -0
hierarchy_qwen3_8b/layer_20.json +17 -0
hierarchy_qwen3_8b/layer_20.pt +3 -0
hierarchy_qwen3_8b/layer_21.json +17 -0
hierarchy_qwen3_8b/layer_21.pt +3 -0
hierarchy_qwen3_8b/layer_22.json +17 -0
hierarchy_qwen3_8b/layer_22.pt +3 -0
hierarchy_qwen3_8b/layer_23.json +17 -0
hierarchy_qwen3_8b/layer_23.pt +3 -0
hierarchy_qwen3_8b/metadata.json +96 -0
refusal_gemma_2_9b_it/layer_14.json +17 -0
refusal_gemma_2_9b_it/layer_14.pt +3 -0

hierarchy_mistral_7b_instruct_v0.2/layer_10.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 10,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 2.21875,
+    "neg_mean_norm": 1.71875,
+    "vector_norm": 1.171875,
+    "created_at": "2025-12-18T07:56:46.687323"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_10.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1006519eb5b358f74bf30a99c8c627f724ffce4df650344d5598b584f58f97a2
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_11.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 11,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 2.515625,
+    "neg_mean_norm": 1.9453125,
+    "vector_norm": 1.375,
+    "created_at": "2025-12-18T07:56:59.172719"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_11.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ed8a8c8648eb0b563ee51a3c12fa9c0621e04a5971f25d0a59fd748efda92ea
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_12.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 12,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 2.796875,
+    "neg_mean_norm": 2.15625,
+    "vector_norm": 1.59375,
+    "created_at": "2025-12-18T07:57:11.731605"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_12.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:250f67ef20cea1c35b0bff4fc053af114810620e981c6e58f4ae8ebf7d9ce7dd
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_13.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 13,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 3.15625,
+    "neg_mean_norm": 2.515625,
+    "vector_norm": 1.875,
+    "created_at": "2025-12-18T07:57:24.201189"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_13.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4f2c18c7d76db7d6ad80f5b17f562066b71d51e26634501d67c4f585a7d2e1e6
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_14.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 14,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 3.46875,
+    "neg_mean_norm": 2.75,
+    "vector_norm": 2.171875,
+    "created_at": "2025-12-18T07:57:36.698532"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_14.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9b1d114124e531ea8bca68532d225a6e4f39cdfe0a634aa83fac6b9f170d9a3a
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_15.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 15,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 4.0,
+    "neg_mean_norm": 3.203125,
+    "vector_norm": 2.515625,
+    "created_at": "2025-12-18T07:57:49.241757"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_15.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c525b49a11073bf3cc35e581882eb059cee3eb90337ab98ec402fbd255b1e6e0
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_16.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 16,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 4.5625,
+    "neg_mean_norm": 3.8125,
+    "vector_norm": 2.796875,
+    "created_at": "2025-12-18T07:58:01.868522"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_16.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e44de7b7d62c10a13d54eaca978cbabf5a0e5b45b88b0341b9a76b9e0c4caa0e
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_17.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 17,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 4.96875,
+    "neg_mean_norm": 4.21875,
+    "vector_norm": 3.25,
+    "created_at": "2025-12-18T07:58:14.433875"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_17.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:02714212448839254a5283e4fab3815a3421f790ca793b6c6622b5301a78b604
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_18.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 18,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 5.75,
+    "neg_mean_norm": 5.03125,
+    "vector_norm": 3.671875,
+    "created_at": "2025-12-18T07:58:26.994268"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_18.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2716a6dc3e5be95d59e5f6d3087ef86b4ea6f89432312b3297e2f1202135bd09
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_19.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 19,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 6.375,
+    "neg_mean_norm": 5.65625,
+    "vector_norm": 4.03125,
+    "created_at": "2025-12-18T07:58:39.596522"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_19.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8a2891da9226cf5e7848205990cb14a1dbb93a154f0f72bc6a5ad9b136377c03
+size 9776

hierarchy_mistral_7b_instruct_v0.2/layer_20.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 20,
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 7.09375,
+    "neg_mean_norm": 6.375,
+    "vector_norm": 4.40625,
+    "created_at": "2025-12-18T07:58:52.211449"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_mistral_7b_instruct_v0.2/layer_20.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f21a277acc94df368c916e79ba65afdf98c26aa4f8e4e249bcf6985bbf701243
+size 9776

hierarchy_mistral_7b_instruct_v0.2/metadata.json ADDED Viewed

	@@ -0,0 +1,89 @@

+{
+  "behavior": "hierarchy",
+  "model_name": "mistralai/Mistral-7B-Instruct-v0.2",
+  "layers": [
+    10,
+    11,
+    12,
+    13,
+    14,
+    15,
+    16,
+    17,
+    18,
+    19,
+    20
+  ],
+  "best_layer": 15,
+  "best_improvement": 0.25,
+  "num_pairs": 26,
+  "target_direction": "increase",
+  "layer_results": {
+    "10": {
+      "0.0": 0.5,
+      "0.5": 0.75,
+      "1.0": 0.5,
+      "1.5": 0.5
+    },
+    "11": {
+      "0.0": 0.5,
+      "0.5": 0.5,
+      "1.0": 0.5,
+      "1.5": 0.5
+    },
+    "12": {
+      "0.0": 0.5,
+      "0.5": 0.75,
+      "1.0": 0.25,
+      "1.5": 0.5
+    },
+    "13": {
+      "0.0": 0.5,
+      "0.5": 0.5,
+      "1.0": 0.25,
+      "1.5": 0.5
+    },
+    "14": {
+      "0.0": 0.5,
+      "0.5": 0.5,
+      "1.0": 0.5,
+      "1.5": 0.25
+    },
+    "15": {
+      "0.0": 0.5,
+      "0.5": 0.25,
+      "1.0": 0.75,
+      "1.5": 0.5
+    },
+    "16": {
+      "0.0": 0.5,
+      "0.5": 0.5,
+      "1.0": 0.5,
+      "1.5": 0.25
+    },
+    "17": {
+      "0.0": 0.5,
+      "0.5": 0.5,
+      "1.0": 0.75,
+      "1.5": 0.0
+    },
+    "18": {
+      "0.0": 0.5,
+      "0.5": 0.75,
+      "1.0": 0.75,
+      "1.5": 0.5
+    },
+    "19": {
+      "0.0": 0.5,
+      "0.5": 0.5,
+      "1.0": 0.75,
+      "1.5": 0.75
+    },
+    "20": {
+      "0.0": 0.5,
+      "0.5": 0.75,
+      "1.0": 0.75,
+      "1.5": 0.25
+    }
+  }
+}

hierarchy_qwen3_8b/layer_12.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 12,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 57.5,
+    "neg_mean_norm": 53.0,
+    "vector_norm": 16.5,
+    "created_at": "2025-12-18T22:23:00.548285"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_12.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce51034b11b188669eec43728629bb4910b7a172f4c1096bda675c8f4e8f29c1
+size 9776

hierarchy_qwen3_8b/layer_13.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 13,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 57.75,
+    "neg_mean_norm": 52.5,
+    "vector_norm": 17.375,
+    "created_at": "2025-12-18T22:23:13.018805"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_13.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a6e78111385cbc647ba93a926857ec0728defacc450004089399612b4040e6ee
+size 9776

hierarchy_qwen3_8b/layer_14.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 14,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 64.0,
+    "neg_mean_norm": 59.5,
+    "vector_norm": 18.25,
+    "created_at": "2025-12-18T22:23:25.489920"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_14.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77e0c227409a6cf799777c3c062be3f8de3bb502486fd4d9a8ac8ad0787b7f06
+size 9776

hierarchy_qwen3_8b/layer_15.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 15,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 64.5,
+    "neg_mean_norm": 59.25,
+    "vector_norm": 20.125,
+    "created_at": "2025-12-18T22:23:37.918916"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_15.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c52325a7cb27e8b27546652ff6ec96617898b552f3bdc3f35e2588277bac3e22
+size 9776

hierarchy_qwen3_8b/layer_16.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 16,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 70.5,
+    "neg_mean_norm": 66.0,
+    "vector_norm": 22.75,
+    "created_at": "2025-12-18T22:23:50.342735"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_16.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f63575f4b03adaca359a235936cad5def59645b5c633eee43a605a3fdc3bb7b4
+size 9776

hierarchy_qwen3_8b/layer_17.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 17,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 79.0,
+    "neg_mean_norm": 72.5,
+    "vector_norm": 24.875,
+    "created_at": "2025-12-18T22:24:02.740801"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_17.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c430e797d25d7da3ae75e29dfb69c9f1086d4b598e1b3c2731fb5b3deb8c0af
+size 9776

hierarchy_qwen3_8b/layer_18.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 18,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 82.0,
+    "neg_mean_norm": 76.0,
+    "vector_norm": 28.5,
+    "created_at": "2025-12-18T22:24:15.178867"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_18.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:413c094daf3f75329afca04e1ef3669d5eabaae2cb96f67ba3d95d8c2c771058
+size 9776

hierarchy_qwen3_8b/layer_19.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 19,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 95.5,
+    "neg_mean_norm": 88.5,
+    "vector_norm": 35.5,
+    "created_at": "2025-12-18T22:24:27.615196"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_19.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:935c01ff2ecd1b7ca76b7216201d9d0aca1ec92d335655547226132418baa919
+size 9776

hierarchy_qwen3_8b/layer_20.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 20,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 102.0,
+    "neg_mean_norm": 97.5,
+    "vector_norm": 38.0,
+    "created_at": "2025-12-18T22:24:40.132334"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_20.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b33e968ee60893fceb743e97b43585079759340346a0446e6d4b98f28b84efb7
+size 9776

hierarchy_qwen3_8b/layer_21.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 21,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 106.5,
+    "neg_mean_norm": 103.0,
+    "vector_norm": 41.75,
+    "created_at": "2025-12-18T22:24:52.616517"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_21.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:355eb6c12243de94f3e020b5d7bf8c512b93f5fef321c4f3af2695c68b5133a5
+size 9776

hierarchy_qwen3_8b/layer_22.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 22,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 131.0,
+    "neg_mean_norm": 127.0,
+    "vector_norm": 50.5,
+    "created_at": "2025-12-18T22:25:05.048245"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_22.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:580cf4c17cb42b36970276ea01be1d4fe720bf4342e179c5eff2c4d31a09497c
+size 9776

hierarchy_qwen3_8b/layer_23.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "instruction_hierarchy",
+  "layer_index": 23,
+  "model_name": "Qwen/Qwen3-8B",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 26,
+    "token_position": "last",
+    "pos_mean_norm": 159.0,
+    "neg_mean_norm": 156.0,
+    "vector_norm": 62.25,
+    "created_at": "2025-12-18T22:25:17.482916"
+  },
+  "vector_shape": [
+    4096
+  ]
+}

hierarchy_qwen3_8b/layer_23.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4cf2b7d9c494448f6350f792048fcd8cce2e810b9e24c4bde228970c18bf3d3c
+size 9776

hierarchy_qwen3_8b/metadata.json ADDED Viewed

	@@ -0,0 +1,96 @@

+{
+  "behavior": "hierarchy",
+  "model_name": "Qwen/Qwen3-8B",
+  "layers": [
+    12,
+    13,
+    14,
+    15,
+    16,
+    17,
+    18,
+    19,
+    20,
+    21,
+    22,
+    23
+  ],
+  "best_layer": 14,
+  "best_improvement": 0.25,
+  "num_pairs": 26,
+  "target_direction": "increase",
+  "layer_results": {
+    "12": {
+      "0.0": 0.0,
+      "0.5": 0.25,
+      "1.0": 0.0,
+      "1.5": 0.25
+    },
+    "13": {
+      "0.0": 0.0,
+      "0.5": 0.25,
+      "1.0": 0.0,
+      "1.5": 0.0
+    },
+    "14": {
+      "0.0": 0.0,
+      "0.5": 0.25,
+      "1.0": 0.25,
+      "1.5": 0.0
+    },
+    "15": {
+      "0.0": 0.0,
+      "0.5": 0.25,
+      "1.0": 0.25,
+      "1.5": 0.5
+    },
+    "16": {
+      "0.0": 0.0,
+      "0.5": 0.0,
+      "1.0": 0.0,
+      "1.5": 0.0
+    },
+    "17": {
+      "0.0": 0.0,
+      "0.5": 0.25,
+      "1.0": 0.25,
+      "1.5": 0.0
+    },
+    "18": {
+      "0.0": 0.0,
+      "0.5": 0.25,
+      "1.0": 0.0,
+      "1.5": 0.25
+    },
+    "19": {
+      "0.0": 0.0,
+      "0.5": 0.0,
+      "1.0": 0.0,
+      "1.5": 0.0
+    },
+    "20": {
+      "0.0": 0.0,
+      "0.5": 0.25,
+      "1.0": 0.25,
+      "1.5": 0.5
+    },
+    "21": {
+      "0.0": 0.0,
+      "0.5": 0.25,
+      "1.0": 0.0,
+      "1.5": 0.0
+    },
+    "22": {
+      "0.0": 0.0,
+      "0.5": 0.0,
+      "1.0": 0.25,
+      "1.5": 0.5
+    },
+    "23": {
+      "0.0": 0.0,
+      "0.5": 0.0,
+      "1.0": 0.25,
+      "1.5": 0.25
+    }
+  }
+}

refusal_gemma_2_9b_it/layer_14.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "behavior": "refusal",
+  "layer_index": 14,
+  "model_name": "google/gemma-2-9b-it",
+  "extraction_method": "caa",
+  "metadata": {
+    "num_pairs": 50,
+    "token_position": "last",
+    "pos_mean_norm": 161.0,
+    "neg_mean_norm": 147.625,
+    "vector_norm": 115.375,
+    "created_at": "2025-12-18T00:57:55.073309"
+  },
+  "vector_shape": [
+    3584
+  ]
+}

refusal_gemma_2_9b_it/layer_14.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bd28df76df8f95e46b419d51abe7b2372be1b1c8676a9224d5bfeeae42f4ee67
+size 8752