Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +73 -0
- archive/TEST_10_PERCENT_policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/fake_completion-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/fake_completion-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/fake_completion-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/fake_completion-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/ignore_all_previous_instructions-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/ignore_all_previous_instructions-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/ignore_all_previous_instructions-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/ignore_all_previous_instructions-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/policy_puppetry_attack-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/policy_puppetry_attack-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/policy_puppetry_attack-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/top_1000_sample_5_percent_policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/true_prefix-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/true_prefix-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/true_prefix-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/true_prefix-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/true_prefix_attack_name.db +0 -0
- archive/virtualization-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/virtualization-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- archive/virtualization-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- baseline_true_prefix-Llama-3.2-1B-Instruct.db +3 -0
- baseline_true_prefix-Llama-3.2-3B-Instruct.db +3 -0
- baseline_true_prefix-Qwen2.5-1.5B-Instruct.db +3 -0
- baseline_true_prefix-Qwen2.5-3B-Instruct.db +3 -0
- business_logic-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- business_logic-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- business_logic-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- business_logic-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_fake_completion-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_fake_completion-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_fake_completion-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_fake_completion-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_ignore_all_previous_instructions-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_ignore_all_previous_instructions-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_ignore_all_previous_instructions-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_ignore_all_previous_instructions-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_policy_puppetry-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_policy_puppetry-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_policy_puppetry-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_policy_puppetry-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_true_prefix-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_true_prefix-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
- defend_self_reminder_defense_true_prefix-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,76 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
archive/TEST_10_PERCENT_policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
archive/fake_completion-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
archive/fake_completion-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
archive/fake_completion-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
archive/fake_completion-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
archive/ignore_all_previous_instructions-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
archive/ignore_all_previous_instructions-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
archive/ignore_all_previous_instructions-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
archive/ignore_all_previous_instructions-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
archive/policy_puppetry_attack-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
archive/policy_puppetry_attack-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
archive/policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
archive/policy_puppetry_attack-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
archive/top_1000_sample_5_percent_policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
archive/true_prefix-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
archive/true_prefix-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
archive/true_prefix-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
archive/true_prefix-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
archive/virtualization-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
archive/virtualization-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
archive/virtualization-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
baseline_true_prefix-Llama-3.2-1B-Instruct.db filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
baseline_true_prefix-Llama-3.2-3B-Instruct.db filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
baseline_true_prefix-Qwen2.5-1.5B-Instruct.db filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
baseline_true_prefix-Qwen2.5-3B-Instruct.db filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
business_logic-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
business_logic-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
business_logic-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
business_logic-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
defend_self_reminder_defense-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
defend_self_reminder_defense-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
defend_self_reminder_defense-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
defend_self_reminder_defense-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
defend_self_reminder_defense_fake_completion-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
defend_self_reminder_defense_fake_completion-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
defend_self_reminder_defense_fake_completion-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
defend_self_reminder_defense_fake_completion-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
defend_self_reminder_defense_ignore_all_previous_instructions-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
defend_self_reminder_defense_ignore_all_previous_instructions-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
defend_self_reminder_defense_ignore_all_previous_instructions-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 76 |
+
defend_self_reminder_defense_ignore_all_previous_instructions-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 77 |
+
defend_self_reminder_defense_policy_puppetry-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 78 |
+
defend_self_reminder_defense_policy_puppetry-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
defend_self_reminder_defense_policy_puppetry-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 80 |
+
defend_self_reminder_defense_policy_puppetry-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 81 |
+
defend_self_reminder_defense_true_prefix-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 82 |
+
defend_self_reminder_defense_true_prefix-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 83 |
+
defend_self_reminder_defense_true_prefix-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 84 |
+
defend_self_reminder_defense_true_prefix-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 85 |
+
defend_self_reminder_defense_virtualization-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 86 |
+
defend_self_reminder_defense_virtualization-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 87 |
+
defend_self_reminder_defense_virtualization-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 88 |
+
defend_self_reminder_defense_virtualization-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 89 |
+
fake_completion-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 90 |
+
fake_completion-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 91 |
+
fake_completion-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 92 |
+
fake_completion-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 93 |
+
ignore_all_previous_instructions-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 94 |
+
ignore_all_previous_instructions-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 95 |
+
ignore_all_previous_instructions-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 96 |
+
ignore_all_previous_instructions-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 97 |
+
policy_puppetry-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 98 |
+
policy_puppetry-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 99 |
+
policy_puppetry-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 100 |
+
policy_puppetry-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
true_prefix-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
true_prefix-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
true_prefix-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
true_prefix-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 105 |
+
virtualization-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 106 |
+
virtualization-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 107 |
+
virtualization-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
| 108 |
+
virtualization-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db filter=lfs diff=lfs merge=lfs -text
|
archive/TEST_10_PERCENT_policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b7671def9b02876620e75d8a49565193d47ecd3b4801a44a964f151b0fbd606
|
| 3 |
+
size 1962946560
|
archive/fake_completion-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9aaf29890d299f31a6eb8cb69daf52803a2124d202020e03e3454443bd612c31
|
| 3 |
+
size 3158016
|
archive/fake_completion-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cdf71d9995549b4b56033ab14c9846528332fc0e49ec112cfed2f7bab52610b5
|
| 3 |
+
size 3944448
|
archive/fake_completion-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8f1035008c494fe235e5674c4d679880003ddf41ad280029f859f99ca317081
|
| 3 |
+
size 4993024
|
archive/fake_completion-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:695f42718edb24fe8ce0deb1dba746e341102b0daa109968a758999b9520b4b8
|
| 3 |
+
size 3158016
|
archive/ignore_all_previous_instructions-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f68f1233cb218d4406566e359c298237258fafdd4a4a8039cc59ac60a242c35f
|
| 3 |
+
size 3158016
|
archive/ignore_all_previous_instructions-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d72a00415e0b054bab33e958145b61605162a230ab21339f73959b94edf98aaa
|
| 3 |
+
size 3944448
|
archive/ignore_all_previous_instructions-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9200c74863ba24cef8f3e9425cb3ee1b3de7fae36f7d7be42c84d091de799d6c
|
| 3 |
+
size 4993024
|
archive/ignore_all_previous_instructions-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf0be6f3fa9acc1c8383d6ae87fa3c51996b53325177c42d82b377b037d45a83
|
| 3 |
+
size 3158016
|
archive/policy_puppetry_attack-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b813dcbe8815bdc0eb71958ad9fff67986ba025ccacf8687af6315053c48ea1
|
| 3 |
+
size 6041600
|
archive/policy_puppetry_attack-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1831c6cb4f33fb92a9e500ae2f38a0f8ab45f11022523dc2209d151dbc55c9e1
|
| 3 |
+
size 6041600
|
archive/policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38f0629a60722959367a7d54c45b26f3c5550d20b0c31bda0ce68b040335cd01
|
| 3 |
+
size 6828032
|
archive/policy_puppetry_attack-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8c3d66a442e998b17dba907c6945b6eba513d6f18f43d5f8f5a8da05cc18f07
|
| 3 |
+
size 6303744
|
archive/top_1000_sample_5_percent_policy_puppetry_attack-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b5b813883cf5bfed1dd94143671117093d259e33ffc78b62bd5191e154c3ad8
|
| 3 |
+
size 1148727296
|
archive/true_prefix-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2282dcfe86a980be8c9b2ab4c6c6e7809e3dc078c665a2db5c9b72f956f152b
|
| 3 |
+
size 1585152
|
archive/true_prefix-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:baeb31b361c27bd0b16f97d726b963a45c60c07d9345ecb1f7ef2c4d77ae29ab
|
| 3 |
+
size 3158016
|
archive/true_prefix-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4691535336c006fdf0621f3cc89269d7d233f3906dd1b967e83a7a237da37842
|
| 3 |
+
size 2633728
|
archive/true_prefix-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc77c3a60e6481f13d96ea73e878115595a8204bc8750894b0a7c27c51532eb7
|
| 3 |
+
size 2895872
|
archive/true_prefix_attack_name.db
ADDED
|
Binary file (12.3 kB). View file
|
|
|
archive/virtualization-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a0238de7cf16d8aef3c54525cbb4865800e4c4d965580d59028d86655cab873
|
| 3 |
+
size 4468736
|
archive/virtualization-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:012613226c11aae479f2d6661d5f8444bf79c92d39369aa671d3232e07ba39f3
|
| 3 |
+
size 3682304
|
archive/virtualization-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea4dd088e86b1c443f7ee786b8d6b6961d02553c41ac8defcfd7441739392415
|
| 3 |
+
size 4206592
|
baseline_true_prefix-Llama-3.2-1B-Instruct.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37ca85f035ab6bae3ecb490aecc5110cad3428f987f5fc220e55b83cfae6209b
|
| 3 |
+
size 3420160
|
baseline_true_prefix-Llama-3.2-3B-Instruct.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ad3ce1453b3e3199528a326403481042af4dcce0a822e9b830795dcee06030d
|
| 3 |
+
size 2895872
|
baseline_true_prefix-Qwen2.5-1.5B-Instruct.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ac1861a31a7e54e346c2f183eb2c0c77294bc455699b5277c9815ee333429a1
|
| 3 |
+
size 1323008
|
baseline_true_prefix-Qwen2.5-3B-Instruct.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd510f010fbe3b375683241f63095449725f3c11026e4145d44af6cfafe0b526
|
| 3 |
+
size 1323008
|
business_logic-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2149e5e726a44a3ed53f82084d9502694896ab4b0a7a8b294d4c80800d14218
|
| 3 |
+
size 2371584
|
business_logic-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58f935ba30f18d87903b175b71676fe5d6bb2e36d554c7108593d05c77fd6f76
|
| 3 |
+
size 1585152
|
business_logic-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0ff455ad605428f1b40d85da1b671190f1d4c7bd01e35abfcee97a4dae2b1d93
|
| 3 |
+
size 2371584
|
business_logic-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9df17afd15131ff20f76588e196644aa3addc12e5e3f22b99205c3b5196555b9
|
| 3 |
+
size 2371584
|
defend_self_reminder_defense-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7d419dd25491005739c199f5d9025254380a73948bee56b75558665854faba4
|
| 3 |
+
size 2633728
|
defend_self_reminder_defense-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:894babff5104b071e8a087df1958a86947218edc40856c3d9bac37888562a132
|
| 3 |
+
size 2633728
|
defend_self_reminder_defense-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2203b2f5adb5fad13468c3277c2cc700b6e3185349063f8914e689558789c55
|
| 3 |
+
size 1847296
|
defend_self_reminder_defense-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:edc71218369bc197bc2938f271473c1f330edc1cb49a549c4ce2cdee21184af7
|
| 3 |
+
size 2895872
|
defend_self_reminder_defense_fake_completion-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89031b097e8bc19a6e65e9863a5e62997cad86e4aa8ad361ae52bc7ebbc0c53d
|
| 3 |
+
size 2895872
|
defend_self_reminder_defense_fake_completion-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d9d8d7240b6b3a2fb8fb5b2c8cfe1d14822533efca1560383bc7cf7a6a4bcb0
|
| 3 |
+
size 2895872
|
defend_self_reminder_defense_fake_completion-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:85b1332cd49c36c3161dbfd13909d6726213b0e24f2ef4fee925db32470d589c
|
| 3 |
+
size 4730880
|
defend_self_reminder_defense_fake_completion-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f68aa78bc9e55168c212aa903c65f64add77dd3333cc5935156e2497ae9f276d
|
| 3 |
+
size 4730880
|
defend_self_reminder_defense_ignore_all_previous_instructions-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:07a304feddd25b6c013f4831d0d2b0b74d7a52d24c992e9d03d9d1ddf93335f2
|
| 3 |
+
size 3682304
|
defend_self_reminder_defense_ignore_all_previous_instructions-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47d41941ff105ba40ae96dce08b807506095b2e3acdae2df1b62f1d8a312dff4
|
| 3 |
+
size 3420160
|
defend_self_reminder_defense_ignore_all_previous_instructions-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2b78687d24ce45266a4ab99ff14f42470705206e21c446f2ad0d6c0a0ec6c78
|
| 3 |
+
size 4993024
|
defend_self_reminder_defense_ignore_all_previous_instructions-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9eb6f884698ca0af28bb106f41ede129a73945fb9bac1903204728c875c50f17
|
| 3 |
+
size 5255168
|
defend_self_reminder_defense_policy_puppetry-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee94ee8ba5fad7bbd1659f76213b54caee8b3b093e95467318856c5015afc0a3
|
| 3 |
+
size 5779456
|
defend_self_reminder_defense_policy_puppetry-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b721b90388cec81874d412b709c7edba2cbd180bbca80ed3b83b5e7fedfcb86
|
| 3 |
+
size 5779456
|
defend_self_reminder_defense_policy_puppetry-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:344b2cbb0e520ae83a9286bf9b902265863377dab4e44b845738fc1ef2e12119
|
| 3 |
+
size 7614464
|
defend_self_reminder_defense_policy_puppetry-Qwen2.5-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e6642e64be31df1a73ca51c6b9dce3c0b8ae59400f4fa022fc1ae27f7e6f0826
|
| 3 |
+
size 6565888
|
defend_self_reminder_defense_true_prefix-Llama-3.2-1B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f785a861e394dc1330ac54c9aad0397d1ea572aa87c3cc8a51284cdf8e311e80
|
| 3 |
+
size 1323008
|
defend_self_reminder_defense_true_prefix-Llama-3.2-3B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74693fe5759497714291d20c71681bc335fa85dac271a829c801bf05b9823639
|
| 3 |
+
size 2633728
|
defend_self_reminder_defense_true_prefix-Qwen2.5-1.5B-Instruct-kivedu-unsloth-defaults-fake-pii-349.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:065f10599be43728d29969f9237eeed958b829b51d76959ed4dfc78ee171125d
|
| 3 |
+
size 1847296
|