Spaces:

holistic-ai
/

AgentGraph

Running

App Files Community

wu981526092 committed on Sep 9, 2025

Commit

ef5205a

1 Parent(s): 290f82e

add

Browse files

Files changed (2) hide show

agentgraph/testing/perturbation_types/jailbreak.py +3 -3
extraction_analysis/cot_extraction_20250909_172744_855dfc94.json +139 -0

agentgraph/testing/perturbation_types/jailbreak.py CHANGED Viewed

@@ -43,9 +43,9 @@ def load_jailbreak_techniques() -> List[Dict[str, Any]]:
         techniques = []
         for _, row in df.iterrows():
             techniques.append({
-                'name': row['topic'] if 'topic' in row else 'Unknown',
-                'prompt': row['prompt'] if 'prompt' in row else '',
-                'description': row['source'] if 'source' in row else ''
             })
         logger.info(f"Successfully loaded {len(techniques)} jailbreak techniques from CSV file")

         techniques = []
         for _, row in df.iterrows():
             techniques.append({
+                'name': row.get('name', 'Unknown'),
+                'prompt': row.get('prompt', ''),
+                'description': row.get('description', '')
             })
         logger.info(f"Successfully loaded {len(techniques)} jailbreak techniques from CSV file")

extraction_analysis/cot_extraction_20250909_172744_855dfc94.json ADDED Viewed

	@@ -0,0 +1,139 @@

+{
+  "timestamp": "20250909_172744",
+  "extraction_id": "855dfc94",
+  "model": "gpt-4o-mini",
+  "reasoning_steps": [],
+  "knowledge_graph": {
+    "system_name": "User Message Response System",
+    "system_summary": "This system is designed to process user messages and generate appropriate responses. The process begins when a user sends a message, which is handled by the `Assistant Agent` (agent_001). The agent undertakes the `Message Processing Task` (task_001) to analyze the user input and generate an output. This collaborative process allows the system to efficiently respond to user inquiries.",
+    "entities": [
+      {
+        "id": "agent_001",
+        "type": "Agent",
+        "name": "Assistant Agent",
+        "importance": "HIGH",
+        "raw_prompt": "",
+        "raw_prompt_ref": [
+          {
+            "line_start": 2,
+            "line_end": 2
+          }
+        ]
+      },
+      {
+        "id": "task_001",
+        "type": "Task",
+        "name": "Message Processing Task",
+        "importance": "HIGH",
+        "raw_prompt": "",
+        "raw_prompt_ref": [
+          {
+            "line_start": 3,
+            "line_end": 3
+          }
+        ]
+      },
+      {
+        "id": "input_001",
+        "type": "Input",
+        "name": "User Message",
+        "importance": "HIGH",
+        "raw_prompt": "",
+        "raw_prompt_ref": [
+          {
+            "line_start": 3,
+            "line_end": 3
+          }
+        ]
+      },
+      {
+        "id": "output_001",
+        "type": "Output",
+        "name": "Agent Response",
+        "importance": "HIGH",
+        "raw_prompt": "",
+        "raw_prompt_ref": [
+          {
+            "line_start": 4,
+            "line_end": 4
+          }
+        ]
+      },
+      {
+        "id": "human_001",
+        "type": "Human",
+        "name": "End User",
+        "importance": "HIGH",
+        "raw_prompt": "",
+        "raw_prompt_ref": [
+          {
+            "line_start": 3,
+            "line_end": 3
+          }
+        ]
+      }
+    ],
+    "relations": [
+      {
+        "id": "rel_001",
+        "source": "input_001",
+        "target": "agent_001",
+        "type": "CONSUMED_BY",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 2,
+            "line_end": 2
+          }
+        ]
+      },
+      {
+        "id": "rel_002",
+        "source": "agent_001",
+        "target": "task_001",
+        "type": "PERFORMS",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 2,
+            "line_end": 2
+          }
+        ]
+      },
+      {
+        "id": "rel_003",
+        "source": "task_001",
+        "target": "output_001",
+        "type": "PRODUCES",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 4,
+            "line_end": 4
+          }
+        ]
+      },
+      {
+        "id": "rel_004",
+        "source": "output_001",
+        "target": "human_001",
+        "type": "DELIVERS_TO",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 4,
+            "line_end": 4
+          }
+        ]
+      }
+    ],
+    "failures": [],
+    "optimizations": []
+  },
+  "input_trace_length": 184,
+  "input_trace_preview": "<L1> {\n<L2>   \"agent_name\": \"assistant\",\n<L3>   \"input\": \"user message\",\n<L4>   \"output\": \"agent response\",\n<L5>   \"timestamp\": \"2024-08-31\",\n<L6>   \"trace_id\": \"test-trace-123\"\n<L7> }"
+}