narcolepticchicken
/

occ-stack

ml-intern

Model card Files Files and versions

xet

Community

narcolepticchicken commited on 26 days ago

Commit

8ee1677

verified ·

1 Parent(s): ea66c97

Upload notebook_walkthrough.ipynb

Browse files

Files changed (1) hide show

notebook_walkthrough.ipynb +120 -45

notebook_walkthrough.ipynb CHANGED Viewed

@@ -6,7 +6,9 @@
    "source": [
     "# OCC Stack Walkthrough\n",
     "\n",
-    "This notebook demonstrates the Oracle-Credit-Compute (OCC) stack for agentic compute allocation."
    ]
   },
   {
@@ -22,7 +24,7 @@
     "from oracle.oracle import ImpactOracle\n",
     "from ledger.ledger import CreditLedger\n",
     "from broker.broker import ResourceBroker, Decision\n",
-    "from rl.reward import RewardHook, OfflineComparator"
    ]
   },
   {
@@ -31,7 +33,8 @@
    "source": [
     "## 1. Impact Oracle\n",
     "\n",
-    "The oracle scores whether an action produced measurable marginal value."
    ]
   },
   {
@@ -42,18 +45,19 @@
    "source": [
     "oracle = ImpactOracle(compute_budget=1e5)\n",
     "\n",
-    "# Score a code attempt\n",
     "result = oracle.score(\n",
     "    mode=\"code\",\n",
-    "    action={\"tokens_used\": 50},\n",
-    "    context={\"previous_passed\": False},\n",
-    "    result={\"passed\": True, \"hidden_passed\": True, \"compute_cost\": 50},\n",
     "    agent_id=\"agent_1\"\n",
     ")\n",
-    "print(f\"Raw score: {result.raw_score}\")\n",
-    "print(f\"Cost-adjusted: {result.cost_adjusted_score}\")\n",
-    "print(f\"Reward: {result.reward_value}\")\n",
-    "print(f\"Reason: {result.reason}\")"
    ]
   },
   {
@@ -62,7 +66,7 @@
    "source": [
     "## 2. Credit Ledger\n",
     "\n",
-    "Credits are non-transferable, decaying, and capability-scoped."
    ]
   },
   {
@@ -73,7 +77,7 @@
    "source": [
     "ledger = CreditLedger(decay_lambda=0.05)\n",
     "\n",
-    "# Agent earns credits\n",
     "ledger.earn(\n",
     "    agent_id=\"agent_1\",\n",
     "    task_id=\"task_1\",\n",
@@ -81,18 +85,23 @@
     "    amount=10.0,\n",
     "    oracle_score=1.0,\n",
     "    compute_cost=50.0,\n",
-    "    reason=\"pass_hidden_test\"\n",
     ")\n",
     "\n",
-    "print(f\"Balance: {ledger.balance('agent_1')}\")\n",
-    "\n",
-    "# Try to transfer (blocked)\n",
     "success = ledger.transfer(\"agent_1\", \"agent_2\", 5.0)\n",
     "print(f\"Transfer succeeded: {success}\")\n",
     "\n",
     "# Spend credits\n",
-    "ok, entry = ledger.spend(\"agent_1\", \"task_1\", \"action_2\", 3.0, reason=\"retrieval_call\")\n",
-    "print(f\"Spend succeeded: {ok}, remaining: {ledger.balance('agent_1')}\")"
    ]
   },
   {
@@ -113,16 +122,20 @@
     "broker = ResourceBroker()\n",
     "\n",
     "# Low credit -> deny\n",
-    "dec = broker.request(\"model_call_large\", \"agent_1\", 1.0)\n",
     "print(f\"Low credit: {dec.decision.value} - {dec.reason}\")\n",
     "\n",
-    "# High credit -> allow (with approval for high-risk)\n",
-    "dec = broker.request(\"model_call_large\", \"agent_1\", 50.0)\n",
     "print(f\"High credit: {dec.decision.value} - {dec.reason}\")\n",
     "\n",
-    "# Gaming detected -> escalate\n",
-    "dec = broker.request(\"file_write\", \"agent_1\", 100.0, agent_flags={\"gaming_score\": 0.6})\n",
-    "print(f\"Gaming: {dec.decision.value} - {dec.reason}\")"
    ]
   },
   {
@@ -131,7 +144,20 @@
    "source": [
     "## 4. GRPO Reward Hook\n",
     "\n",
-    "Connects the oracle to RL reward computation."
    ]
   },
   {
@@ -140,27 +166,40 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "hook = RewardHook(oracle, ledger, broker, mode=\"code\", agent_id=\"rl_agent\")\n",
     "\n",
     "prompts = [\"def add(a, b):\\n    return\"] * 3\n",
     "completions = [\"a + b\", \"a * b\", \"a + b + 0\"]\n",
-    "oracle_inputs = [\n",
-    "    {\"action\": {}, \"context\": {}, \"result\": {\"passed\": True, \"hidden_passed\": True, \"compute_cost\": 5}, \"task_id\": \"t1\", \"action_id\": \"a1\"},\n",
-    "    {\"action\": {}, \"context\": {}, \"result\": {\"passed\": False, \"hidden_passed\": False, \"compute_cost\": 5}, \"task_id\": \"t1\", \"action_id\": \"a2\"},\n",
-    "    {\"action\": {}, \"context\": {}, \"result\": {\"passed\": True, \"hidden_passed\": True, \"compute_cost\": 5}, \"task_id\": \"t1\", \"action_id\": \"a3\"},\n",
-    "]\n",
     "\n",
-    "rewards = hook.compute_rewards(prompts, completions, oracle_inputs)\n",
-    "print(\"Rewards:\", rewards)"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "## 5. Code Benchmark\n",
     "\n",
-    "Run the compute allocation benchmark."
    ]
   },
   {
@@ -171,21 +210,53 @@
    "source": [
     "from benchmarks.benchmark_code import CodeBenchmark\n",
     "\n",
-    "bench = CodeBenchmark(max_problems=50, seed=42)\n",
-    "bench.load_data()\n",
     "results = bench.run_all()\n",
     "\n",
     "for label, res in results.items():\n",
-    "    print(f\"{label:20s}: pass@1={res['pass@1']:.3f}, compute/problem={res['compute_per_problem']:.0f}\")"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "## 6. Ablation Study\n",
     "\n",
-    "Compare OCC with ablated configurations."
    ]
   },
   {
@@ -197,10 +268,14 @@
     "from eval_runner import AblationRunner\n",
     "\n",
     "runner = AblationRunner(seed=42)\n",
-    "code_ablations = runner.ablation_code()\n",
     "\n",
-    "for k, v in code_ablations.items():\n",
-    "    print(f\"{k:20s}: pass@1={v.get('pass@1', 'N/A'):.3f}, compute={v.get('total_compute', 'N/A'):.0f}\")"
    ]
   }
  ],
@@ -217,4 +292,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 4
-}

    "source": [
     "# OCC Stack Walkthrough\n",
     "\n",
+    "This notebook demonstrates the Oracle-Credit-Compute (OCC) stack for agentic compute allocation.\n",
+    "\n",
+    "**Repository:** https://huggingface.co/narcolepticchicken/occ-stack"
    ]
   },
   {
     "from oracle.oracle import ImpactOracle\n",
     "from ledger.ledger import CreditLedger\n",
     "from broker.broker import ResourceBroker, Decision\n",
+    "from rl.reward import RewardHook, OfflinePolicyComparator"
    ]
   },
   {
    "source": [
     "## 1. Impact Oracle\n",
     "\n",
+    "The oracle scores whether an action produced measurable marginal value.\n",
+    "Modes: `code`, `retrieval_qa`, `debate`"
    ]
   },
   {
    "source": [
     "oracle = ImpactOracle(compute_budget=1e5)\n",
     "\n",
+    "# Score a code attempt that passes hidden tests\n",
     "result = oracle.score(\n",
     "    mode=\"code\",\n",
+    "    action={\"attempt\": 1},\n",
+    "    context={\"difficulty\": 0.5},\n",
+    "    result={\"correctness\": 1.0, \"pass_at_k\": 1.0, \"regression\": False, \"compute_cost\": 50.0, \"public_pass\": True, \"hidden_tests_pass\": True},\n",
     "    agent_id=\"agent_1\"\n",
     ")\n",
+    "print(f\"Raw score: {result.raw_score:.3f}\")\n",
+    "print(f\"Cost-adjusted: {result.cost_adjusted_score:.3f}\")\n",
+    "print(f\"Reward: {result.reward_value:.3f}\")\n",
+    "print(f\"Reason: {result.reason}\")\n",
+    "print(f\"Failure tags: {result.failure_tags}\")"
    ]
   },
   {
    "source": [
     "## 2. Credit Ledger\n",
     "\n",
+    "Credits are **non-transferable**, **decaying**, and **capability-scoped**."
    ]
   },
   {
    "source": [
     "ledger = CreditLedger(decay_lambda=0.05)\n",
     "\n",
+    "# Agent earns credits for a successful action\n",
     "ledger.earn(\n",
     "    agent_id=\"agent_1\",\n",
     "    task_id=\"task_1\",\n",
     "    amount=10.0,\n",
     "    oracle_score=1.0,\n",
     "    compute_cost=50.0,\n",
+    "    reason=\"pass_hidden_test\",\n",
+    "    capability_scope=\"model_call\"\n",
     ")\n",
+    "print(f\"Balance after earn: {ledger.balance('agent_1', 'model_call', 'global'):.2f}\")\n",
     "\n",
+    "# Try to transfer (blocked by design)\n",
     "success = ledger.transfer(\"agent_1\", \"agent_2\", 5.0)\n",
     "print(f\"Transfer succeeded: {success}\")\n",
     "\n",
     "# Spend credits\n",
+    "ok = ledger.spend(\"agent_1\", \"task_1\", \"retrieval_call\", 3.0, capability_scope=\"model_call\", reason=\"retrieval\")\n",
+    "print(f\"Spend succeeded: {ok}, remaining: {ledger.balance('agent_1', 'model_call', 'global'):.2f}\")\n",
+    "\n",
+    "# Provenance\n",
+    "entries = ledger.provenance(\"agent_1\")\n",
+    "for e in entries:\n",
+    "    print(f\"  {e.reason}: earn={e.earned_credit:.1f}, spend={e.spent_credit:.1f}, balance={e.remaining_credit:.1f}\")"
    ]
   },
   {
     "broker = ResourceBroker()\n",
     "\n",
     "# Low credit -> deny\n",
+    "dec = broker.request(\"model_call\", \"agent_1\", 1.0)\n",
     "print(f\"Low credit: {dec.decision.value} - {dec.reason}\")\n",
     "\n",
+    "# High credit -> allow\n",
+    "dec = broker.request(\"model_call\", \"agent_1\", 50.0)\n",
     "print(f\"High credit: {dec.decision.value} - {dec.reason}\")\n",
     "\n",
+    "# High-risk with gaming flags -> deny\n",
+    "dec = broker.request(\"file_write\", \"agent_1\", 100.0, gaming_flags=[\"confidence_manipulation\"])\n",
+    "print(f\"Gaming flagged: {dec.decision.value} - {dec.reason}\")\n",
+    "\n",
+    "# List allowed capabilities\n",
+    "allowed = broker.get_allowed_capabilities(\"agent_1\", 50.0)\n",
+    "print(f\"Allowed capabilities: {allowed}\")"
    ]
   },
   {
    "source": [
     "## 4. GRPO Reward Hook\n",
     "\n",
+    "Connects the oracle to RL reward computation.\n",
+    "\n",
+    "Usage with TRL:\n",
+    "```python\n",
+    "from grpo_hook import make_occ_reward_func\n",
+    "from trl import GRPOTrainer\n",
+    "\n",
+    "reward_fn = make_occ_reward_func(mode='code', compute_budget=1e5)\n",
+    "trainer = GRPOTrainer(\n",
+    "    model='Qwen/Qwen2.5-0.5B-Instruct',\n",
+    "    reward_funcs=reward_fn,\n",
+    "    train_dataset=ds,\n",
+    ")\n",
+    "```"
    ]
   },
   {
    "metadata": {},
    "outputs": [],
    "source": [
+    "hook = RewardHook(oracle=oracle, mode=\"code\")\n",
     "\n",
     "prompts = [\"def add(a, b):\\n    return\"] * 3\n",
     "completions = [\"a + b\", \"a * b\", \"a + b + 0\"]\n",
+    "answers = [\"a + b\", \"a * b\", \"a + b + 0\"]\n",
+    "gold_answers = [\"a + b\"] * 3\n",
+    "confidences = [0.9, 0.9, 0.6]\n",
+    "compute_costs = [5.0, 5.0, 8.0]\n",
     "\n",
+    "rewards = hook.compute_rewards(\n",
+    "    prompts=prompts,\n",
+    "    completions=completions,\n",
+    "    answers=answers,\n",
+    "    gold_answers=gold_answers,\n",
+    "    confidences=confidences,\n",
+    "    compute_costs=compute_costs,\n",
+    ")\n",
+    "print(\"Rewards:\", rewards)\n",
+    "\n",
+    "# Offline comparison of two policies\n",
+    "comparator = OfflinePolicyComparator(reward_hook=hook)\n",
+    "policy_a = [{\"reward\": 0.5 + i*0.02, \"failure_tags\": []} for i in range(10)]\n",
+    "policy_b = [{\"reward\": 0.4 + i*0.01, \"failure_tags\": []} for i in range(10)]\n",
+    "result = comparator.compare(policy_a, policy_b)\n",
+    "print(result)"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "## 5. Code Benchmark (Simulated)\n",
     "\n",
+    "Run the compute allocation benchmark with tiered agents."
    ]
   },
   {
    "source": [
     "from benchmarks.benchmark_code import CodeBenchmark\n",
     "\n",
+    "bench = CodeBenchmark(n_problems=50, seed=42)\n",
     "results = bench.run_all()\n",
     "\n",
+    "print(f\"{'Strategy':<25} {'pass@1':>8} {'Hidden':>8} {'Compute':>10} {'Savings':>8}\")\n",
     "for label, res in results.items():\n",
+    "    p1 = res.get('pass_at_1', 0.0)\n",
+    "    hid = res.get('hidden_pass', 0.0)\n",
+    "    comp = res.get('total_compute', 0.0)\n",
+    "    sav = res.get('compute_savings', None)\n",
+    "    sav_str = f\"{sav:.1%}\" if sav is not None else \"-\"\n",
+    "    print(f\"{label:<25} {p1:>8.3f} {hid:>8.3f} {comp:>10.0f} {sav_str:>8}\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 6. Debate Benchmark v2 (Adversarial Agents)\n",
+    "\n",
+    "Run multi-agent debate with variable-cost agents and adversarial participants."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from benchmarks.benchmark_debate_v2 import DebateBenchmarkV2\n",
+    "\n",
+    "bench = DebateBenchmarkV2(n_topics=50, n_agents=5, adversarial_fraction=0.4, seed=42)\n",
+    "bench.generate_topics()\n",
+    "results = bench.run_all()\n",
+    "\n",
+    "print(f\"{'Strategy':<25} {'Acc':>6} {'Comp/T':>8} {'Turns':>6} {'AdvT':>6} {'Contain':>8}\")\n",
+    "for key in ['A_equal_turns', 'B_majority_vote', 'C_confidence_weighted', 'E_occ', 'F_occ_no_decay']:\n",
+    "    r = results[key]\n",
+    "    print(f\"{r['label']:<25} {r['accuracy']:>6.3f} {r['mean_compute_per_topic']:>8.0f} {r['mean_turns']:>6.1f} {r['mean_adv_turns']:>6.1f} {r['bad_agent_containment']:>8.2f}\")"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "## 7. Anti-Gaming Tests\n",
     "\n",
+    "Test the credit system against adversarial attacks."
    ]
   },
   {
     "from eval_runner import AblationRunner\n",
     "\n",
     "runner = AblationRunner(seed=42)\n",
+    "anti = runner.anti_gaming_tests()\n",
     "\n",
+    "for k, v in anti.items():\n",
+    "    if 'accuracy' in v:\n",
+    "        print(f\"{k:25s}: acc={v['accuracy']:.3f}, compute={v.get('total_compute', 'N/A')}\")\n",
+    "    elif 'pass_at_1' in v or 'pass@1' in v:\n",
+    "        p1 = v.get('pass_at_1', v.get('pass@1', 'N/A'))\n",
+    "        print(f\"{k:25s}: pass@1={p1:.3f}, compute={v.get('total_compute', 'N/A')}\")"
    ]
   }
  ],
  },
  "nbformat": 4,
  "nbformat_minor": 4
+}