Spaces:
Sleeping
Sleeping
gary-boon
Claude
committed on
Commit
·
f5ba954
1
Parent(s):
9e9dc34
Fix research attention endpoint model compatibility
Browse files
Make QKV hook registration more robust to support different model
architectures (CodeGen vs GPT-2 style attention modules)
🤖 Generated with [Claude Code](https://claude.com/claude-code)
Co-Authored-By: Claude <noreply@anthropic.com>
- backend/model_service.py +14 -4
backend/model_service.py
CHANGED
|
@@ -1327,10 +1327,20 @@ async def analyze_research_attention(request: Dict[str, Any], authenticated: boo
|
|
| 1327 |
}
|
| 1328 |
return hook
|
| 1329 |
|
| 1330 |
-
# Register hooks on all qkv_proj modules
|
| 1331 |
-
|
| 1332 |
-
|
| 1333 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1334 |
|
| 1335 |
with torch.no_grad():
|
| 1336 |
current_ids = inputs["input_ids"]
|
|
|
|
| 1327 |
}
|
| 1328 |
return hook
|
| 1329 |
|
| 1330 |
+
# Register hooks on all qkv_proj modules (if available)
|
| 1331 |
+
# This is model-specific - CodeGen uses different architecture
|
| 1332 |
+
try:
|
| 1333 |
+
if hasattr(manager.model, 'transformer') and hasattr(manager.model.transformer, 'h'):
|
| 1334 |
+
for layer_idx, layer in enumerate(manager.model.transformer.h):
|
| 1335 |
+
if hasattr(layer, 'attn') and hasattr(layer.attn, 'qkv_proj'):
|
| 1336 |
+
hook = layer.attn.qkv_proj.register_forward_hook(make_qkv_hook(layer_idx))
|
| 1337 |
+
hooks.append(hook)
|
| 1338 |
+
elif hasattr(layer, 'attn') and hasattr(layer.attn, 'c_attn'):
|
| 1339 |
+
# GPT-2 style attention
|
| 1340 |
+
hook = layer.attn.c_attn.register_forward_hook(make_qkv_hook(layer_idx))
|
| 1341 |
+
hooks.append(hook)
|
| 1342 |
+
except Exception as hook_error:
|
| 1343 |
+
logger.warning(f"Could not register QKV hooks: {hook_error}")
|
| 1344 |
|
| 1345 |
with torch.no_grad():
|
| 1346 |
current_ids = inputs["input_ids"]
|