Spaces:

DD009
/

THISverse

Sleeping

App Files Files Community

DD009 committed on Nov 21, 2025

Commit

4af38ee

verified ·

1 Parent(s): dce0034

Upload main.py

Browse files

Files changed (1) hide show

src/main.py +845 -0

src/main.py ADDED Viewed

	@@ -0,0 +1,845 @@

+"""
+Developer Productivity Agent
+RAG-based system using Pinecone for vector storage and GPT-4o-mini.
+Features:
+- Pinecone vector database (2GB free tier)
+- Divided LLM Architecture for cost optimization
+- Real-time cost tracking and analytics
+- OpenAI embeddings (text-embedding-3-small)
+"""
+import os
+import json
+import time
+from pathlib import Path
+from typing import List, Dict, Any, Optional
+import hashlib
+from datetime import datetime
+# Core dependencies
+from fastapi import FastAPI, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel
+import uvicorn
+# Vector database - Pinecone
+from pinecone import Pinecone, ServerlessSpec
+# LLM client
+from openai import OpenAI
+# Code parsing
+import ast
+import re
+from dataclasses import dataclass, field
+# ============================================================================
+# Configuration
+# ============================================================================
+class Config:
+    """Static settings for the agent: credentials, index location, models, chunking, pricing."""
+    # --- Credentials: read from the environment when the class body runs; empty if unset ---
+    OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY", "")
+    PINECONE_API_KEY = os.environ.get("PINECONE_API_KEY", "")
+    # --- Pinecone serverless index ---
+    PINECONE_INDEX_NAME = os.environ.get("PINECONE_INDEX_NAME", "codebase-index")
+    PINECONE_CLOUD = "aws"
+    PINECONE_REGION = "us-east-1"
+    # --- Model selection ---
+    ARCHITECT_MODEL = "gpt-4o-mini"
+    DEVELOPER_MODEL = "gpt-4o-mini"
+    EMBEDDING_MODEL = "text-embedding-3-small"
+    EMBEDDING_DIM = 1536
+    # --- Chunking and retrieval ---
+    CHUNK_SIZE = 1500
+    CHUNK_OVERLAP = 200
+    TOP_K_RESULTS = 10
+    # --- Pricing, in dollars per 1M tokens ---
+    COST_GPT4O_MINI_INPUT = 0.15   # gpt-4o-mini input
+    COST_GPT4O_MINI_OUTPUT = 0.60  # gpt-4o-mini output
+    COST_EMBEDDING = 0.02          # embeddings
+    # GPT-4 rates, kept only as the comparison baseline for the savings figures
+    COST_GPT4_INPUT = 30.0
+    COST_GPT4_OUTPUT = 60.0
+# ============================================================================
+# Cost Tracker
+# ============================================================================
+class CostTracker:
+    """Accumulates token usage for one session and derives cost and savings figures.
+    Dollar amounts use the per-1M-token prices defined on ``Config``. The
+    "traditional" baseline prices the same chat tokens at the GPT-4 rates and
+    does not include embedding tokens.
+    """
+    _PER_MILLION = 1_000_000
+    def __init__(self):
+        self.reset()
+    def reset(self):
+        """Zero every counter, clear the history and restart the session clock."""
+        self.embedding_tokens = 0
+        self.architect_input_tokens = 0
+        self.architect_output_tokens = 0
+        self.developer_input_tokens = 0
+        self.developer_output_tokens = 0
+        self.api_calls = 0
+        self.tickets_processed = 0
+        self.questions_answered = 0
+        self.start_time = datetime.now()
+        self.history = []
+    def add_embedding(self, tokens: int):
+        """Add ``tokens`` embedding tokens and count one API call."""
+        self.embedding_tokens += tokens
+        self.api_calls += 1
+    def add_architect_call(self, input_tokens: int, output_tokens: int):
+        """Add the token usage of one architect LLM call and count one API call."""
+        self.architect_input_tokens += input_tokens
+        self.architect_output_tokens += output_tokens
+        self.api_calls += 1
+    def add_developer_call(self, input_tokens: int, output_tokens: int):
+        """Add the token usage of one developer LLM call and count one API call."""
+        self.developer_input_tokens += input_tokens
+        self.developer_output_tokens += output_tokens
+        self.api_calls += 1
+    def record_ticket(self):
+        """Count one processed ticket and append a history snapshot."""
+        self.tickets_processed += 1
+        self._add_to_history("ticket")
+    def record_question(self):
+        """Count one answered question and append a history snapshot."""
+        self.questions_answered += 1
+        self._add_to_history("question")
+    def _add_to_history(self, event_type: str):
+        """Append a timestamped snapshot of the cumulative cost and savings."""
+        self.history.append({
+            "timestamp": datetime.now().isoformat(),
+            "type": event_type,
+            "cumulative_cost": self.get_actual_cost(),
+            "cumulative_savings": self.get_savings()
+        })
+    def _chat_cost(self, input_tokens: int, output_tokens: int,
+                   input_price: float, output_price: float) -> float:
+        """Price a pair of input/output token counts at the given per-1M-token rates."""
+        return (
+            (input_tokens / self._PER_MILLION) * input_price +
+            (output_tokens / self._PER_MILLION) * output_price
+        )
+    def get_actual_cost(self) -> float:
+        """Return the dollars spent so far: embeddings plus both gpt-4o-mini roles."""
+        embedding_cost = (self.embedding_tokens / self._PER_MILLION) * Config.COST_EMBEDDING
+        architect_cost = self._chat_cost(
+            self.architect_input_tokens, self.architect_output_tokens,
+            Config.COST_GPT4O_MINI_INPUT, Config.COST_GPT4O_MINI_OUTPUT
+        )
+        developer_cost = self._chat_cost(
+            self.developer_input_tokens, self.developer_output_tokens,
+            Config.COST_GPT4O_MINI_INPUT, Config.COST_GPT4O_MINI_OUTPUT
+        )
+        return embedding_cost + architect_cost + developer_cost
+    def get_traditional_cost(self) -> float:
+        """Return what the same chat tokens would cost at the GPT-4 baseline rates."""
+        total_input = self.architect_input_tokens + self.developer_input_tokens
+        total_output = self.architect_output_tokens + self.developer_output_tokens
+        return self._chat_cost(total_input, total_output,
+                               Config.COST_GPT4_INPUT, Config.COST_GPT4_OUTPUT)
+    def get_savings(self) -> float:
+        """Return baseline cost minus actual cost, in dollars."""
+        return self.get_traditional_cost() - self.get_actual_cost()
+    def get_savings_percentage(self) -> float:
+        """Return savings as a percentage of the baseline cost (0.0 when the baseline is zero)."""
+        traditional = self.get_traditional_cost()
+        if traditional == 0:
+            return 0.0
+        return ((traditional - self.get_actual_cost()) / traditional) * 100
+    def get_stats(self) -> Dict[str, Any]:
+        """Return a JSON-friendly summary of costs, token counts and recent history."""
+        actual_cost = self.get_actual_cost()
+        # total_seconds() covers the whole elapsed interval; timedelta.seconds alone
+        # drops whole days and would wrap back to zero after 24 hours.
+        elapsed_seconds = (datetime.now() - self.start_time).total_seconds()
+        return {
+            "actual_cost": round(actual_cost, 6),
+            "traditional_cost": round(self.get_traditional_cost(), 6),
+            "savings": round(self.get_savings(), 6),
+            "savings_percentage": round(self.get_savings_percentage(), 2),
+            "total_tokens": {
+                "embedding": self.embedding_tokens,
+                "architect_input": self.architect_input_tokens,
+                "architect_output": self.architect_output_tokens,
+                "developer_input": self.developer_input_tokens,
+                "developer_output": self.developer_output_tokens,
+                "total": (self.embedding_tokens + self.architect_input_tokens +
+                         self.architect_output_tokens + self.developer_input_tokens +
+                         self.developer_output_tokens)
+            },
+            "api_calls": self.api_calls,
+            "tickets_processed": self.tickets_processed,
+            "questions_answered": self.questions_answered,
+            "session_duration_minutes": round(elapsed_seconds / 60, 2),
+            # max(..., 1) avoids dividing by zero before the first ticket
+            "cost_per_ticket": round(actual_cost / max(self.tickets_processed, 1), 6),
+            "history": self.history[-50:]  # Last 50 events
+        }
+# Module-level tracker instance; the indexer and both LLM wrappers in this file record their usage on it
+cost_tracker = CostTracker()
+# ============================================================================
+# Data Models
+# ============================================================================
+class JiraTicket(BaseModel):
+    # Request model for one Jira ticket. ticket_id, title, description and
+    # acceptance_criteria are interpolated into the architect's analysis prompt.
+    ticket_id: str
+    title: str
+    description: str
+    acceptance_criteria: Optional[str] = None  # the prompt shows 'Not specified' when this is empty
+    labels: Optional[List[str]] = None  # accepted but not read by the code visible in this file
+class ImplementationPlan(BaseModel):
+    # Response model assembled by DevProductivityAgent.process_ticket.
+    ticket_summary: str  # 'summary' from the ticket analysis
+    key_entities: List[str]  # 'key_entities' from the ticket analysis
+    relevant_files: List[Dict[str, str]]  # per search hit: 'path', 'relevance' (line range), 'preview'
+    implementation_steps: List[str]  # 'implementation_steps' from the strategy
+    prerequisites: List[str]  # 'prerequisites' from the ticket analysis
+    boilerplate_code: Dict[str, str]  # generated code keyed by file path
+    architecture_notes: str  # 'architecture_notes' from the strategy
+    estimated_complexity: str  # 'complexity' from the analysis; 'Unknown' when missing
+# ============================================================================
+# Pinecone-based Codebase Indexer
+# ============================================================================
+class CodebaseIndexer:
+    """Chunks source files, embeds them with OpenAI and stores/searches them in Pinecone.
+    Both remote clients are created lazily on first use, so the object can be
+    constructed before any API key is configured.
+    """
+    # File extension -> language label stored in each chunk's metadata.
+    _LANGUAGE_BY_EXT = {
+        '.py': 'python', '.js': 'javascript', '.jsx': 'javascript',
+        '.ts': 'typescript', '.tsx': 'typescript', '.java': 'java',
+        '.go': 'go', '.rs': 'rust', '.cpp': 'cpp', '.c': 'c',
+    }
+    # Directory names that are never indexed (compared against whole path components).
+    _SKIP_DIRS = frozenset({'node_modules', '__pycache__', '.git', 'venv', '.venv'})
+    # Assumed characters per source line; converts the character budgets in Config to line counts.
+    _CHARS_PER_LINE = 50
+    # Number of vectors sent per upsert request.
+    _UPSERT_BATCH = 100
+    # Upper bound, in seconds, on waiting for a newly created index to report ready.
+    _INDEX_READY_TIMEOUT = 60
+    def __init__(self, config: Config):
+        self.config = config
+        self._openai_client = None
+        self._pinecone_client = None
+        self._index = None
+    @property
+    def openai_client(self):
+        """Return the cached OpenAI client, creating it on first access.
+        Raises:
+            ValueError: if no OpenAI API key is configured.
+        """
+        if self._openai_client is None:
+            if not self.config.OPENAI_API_KEY:
+                raise ValueError("OpenAI API key required")
+            self._openai_client = OpenAI(api_key=self.config.OPENAI_API_KEY)
+        return self._openai_client
+    @property
+    def index(self):
+        """Return the cached Pinecone index handle, creating the index if it does not exist.
+        Raises:
+            ValueError: if no Pinecone API key is configured.
+        """
+        if self._index is None:
+            if not self.config.PINECONE_API_KEY:
+                raise ValueError("Pinecone API key required")
+            pc = Pinecone(api_key=self.config.PINECONE_API_KEY)
+            name = self.config.PINECONE_INDEX_NAME
+            if name not in pc.list_indexes().names():
+                pc.create_index(
+                    name=name,
+                    dimension=self.config.EMBEDDING_DIM,
+                    metric="cosine",
+                    spec=ServerlessSpec(
+                        cloud=self.config.PINECONE_CLOUD,
+                        region=self.config.PINECONE_REGION
+                    )
+                )
+                self._wait_until_ready(pc, name)
+            self._index = pc.Index(name)
+            print(f"📂 Pinecone index ready: {self.config.PINECONE_INDEX_NAME}")
+        return self._index
+    def _wait_until_ready(self, pc, name: str) -> None:
+        """Poll the index description until it reports ready or the timeout elapses."""
+        deadline = time.monotonic() + self._INDEX_READY_TIMEOUT
+        while time.monotonic() < deadline:
+            try:
+                if pc.describe_index(name).status['ready']:
+                    return
+            except Exception:
+                # Treat a failed status lookup as "not ready yet" and keep polling.
+                pass
+            time.sleep(1)
+        # Best effort: on timeout the caller still proceeds to open the index.
+    def _track_embedding_usage(self, response, texts: List[str]) -> None:
+        """Record embedding tokens, preferring API-reported usage over the length estimate."""
+        usage = getattr(response, 'usage', None)
+        tokens = getattr(usage, 'total_tokens', None)
+        if tokens is None:
+            # Fallback estimate (rough: 1 token ≈ 4 chars)
+            tokens = sum(len(t) // 4 for t in texts)
+        cost_tracker.add_embedding(tokens)
+    def _get_embedding(self, text: str) -> List[float]:
+        """Embed one text and record its token usage after the call succeeds."""
+        response = self.openai_client.embeddings.create(
+            model=self.config.EMBEDDING_MODEL,
+            input=text
+        )
+        self._track_embedding_usage(response, [text])
+        return response.data[0].embedding
+    def _get_embeddings_batch(self, texts: List[str]) -> List[List[float]]:
+        """Embed several texts in one request; returns one vector per input, in input order."""
+        if not texts:
+            return []
+        response = self.openai_client.embeddings.create(
+            model=self.config.EMBEDDING_MODEL,
+            input=texts
+        )
+        self._track_embedding_usage(response, texts)
+        # Order by the reported index when present so vectors line up with ``texts``.
+        items = sorted(response.data, key=lambda item: getattr(item, 'index', 0))
+        return [item.embedding for item in items]
+    def _detect_language(self, file_path: str) -> str:
+        """Map the file extension to a language label, or 'unknown'."""
+        return self._LANGUAGE_BY_EXT.get(Path(file_path).suffix.lower(), 'unknown')
+    def _chunk_content(self, content: str, file_path: str) -> List[Dict[str, Any]]:
+        """Split ``content`` into overlapping line-based chunks.
+        Each chunk dict carries 'content', 'file_path', 'chunk_index',
+        1-based 'line_start'/'line_end' and 'language'. Whitespace-only chunks
+        are dropped.
+        """
+        chunks = []
+        lines = content.split('\n')
+        # Clamp so every chunk has at least one line and every step moves forward;
+        # without this a CHUNK_SIZE below 50 or an overlap >= the chunk size never terminates.
+        chunk_lines = max(1, self.config.CHUNK_SIZE // self._CHARS_PER_LINE)
+        overlap_lines = min(max(0, self.config.CHUNK_OVERLAP // self._CHARS_PER_LINE),
+                            chunk_lines - 1)
+        language = self._detect_language(file_path)
+        i = 0
+        chunk_idx = 0
+        while i < len(lines):
+            end = min(i + chunk_lines, len(lines))
+            chunk_content = '\n'.join(lines[i:end])
+            if chunk_content.strip():  # Skip empty chunks
+                chunks.append({
+                    'content': chunk_content,
+                    'file_path': file_path,
+                    'chunk_index': chunk_idx,
+                    'line_start': i + 1,
+                    'line_end': end,
+                    'language': language
+                })
+            # Step back by the overlap unless this chunk already reached the last line.
+            i = end - overlap_lines if end < len(lines) else end
+            # The index advances for skipped chunks too, so it tracks position in the file.
+            chunk_idx += 1
+        return chunks
+    def index_file(self, file_path: str, content: str) -> int:
+        """Chunk, embed and upsert one file; return the number of chunks stored."""
+        chunks = self._chunk_content(content, file_path)
+        if not chunks:
+            return 0
+        embeddings = self._get_embeddings_batch([c['content'] for c in chunks])
+        vectors = []
+        for chunk, embedding in zip(chunks, embeddings):
+            # Id derived from path and chunk index: the same chunk always maps to the same id.
+            vector_id = hashlib.md5(
+                f"{file_path}_{chunk['chunk_index']}".encode()
+            ).hexdigest()
+            vectors.append({
+                "id": vector_id,
+                "values": embedding,
+                "metadata": {
+                    "file_path": file_path,
+                    "chunk_index": chunk['chunk_index'],
+                    "language": chunk['language'],
+                    "line_start": chunk['line_start'],
+                    "line_end": chunk['line_end'],
+                    # Only the first 1000 characters are stored, to keep metadata small;
+                    # search results therefore return at most this much text per chunk.
+                    "content": chunk['content'][:1000]
+                }
+            })
+        # Send in bounded batches so a large file does not produce one oversized request.
+        for start in range(0, len(vectors), self._UPSERT_BATCH):
+            self.index.upsert(vectors=vectors[start:start + self._UPSERT_BATCH])
+        return len(vectors)
+    def index_directory(self, directory_path: str, extensions: List[str] = None) -> Dict[str, Any]:
+        """Index every matching file under ``directory_path``.
+        Args:
+            directory_path: root directory to walk recursively.
+            extensions: file suffixes to include; defaults to common source extensions.
+        Returns:
+            Mapping of file path to chunk count, or to an "Error: ..." string when
+            reading or indexing that file failed.
+        """
+        if extensions is None:
+            extensions = ['.py', '.js', '.jsx', '.ts', '.tsx', '.java', '.go']
+        results = {}
+        directory = Path(directory_path)
+        for ext in extensions:
+            for file_path in directory.rglob(f"*{ext}"):
+                # Compare whole directory names below the root; a substring test on the
+                # full path would also skip e.g. ".github" or a root located under "venv".
+                parent_dirs = file_path.relative_to(directory).parts[:-1]
+                if self._SKIP_DIRS.intersection(parent_dirs):
+                    continue
+                try:
+                    content = file_path.read_text(encoding='utf-8')
+                    chunks = self.index_file(str(file_path), content)
+                    results[str(file_path)] = chunks
+                    print(f"  ✅ {file_path.name}: {chunks} chunks")
+                except Exception as e:
+                    # One unreadable or failing file must not abort the whole run.
+                    results[str(file_path)] = f"Error: {e}"
+        return results
+    def search(self, query: str, top_k: int = None) -> List[Dict[str, Any]]:
+        """Embed ``query`` and return the closest chunks.
+        Each result has 'content', a 'metadata' dict (file_path, line_start,
+        line_end, language) and the match 'score'. ``top_k`` defaults to
+        ``Config.TOP_K_RESULTS``.
+        """
+        if top_k is None:
+            top_k = self.config.TOP_K_RESULTS
+        query_embedding = self._get_embedding(query)
+        results = self.index.query(
+            vector=query_embedding,
+            top_k=top_k,
+            include_metadata=True
+        )
+        return [
+            {
+                'content': match.metadata.get('content', ''),
+                'metadata': {
+                    'file_path': match.metadata.get('file_path', ''),
+                    'line_start': match.metadata.get('line_start', 0),
+                    'line_end': match.metadata.get('line_end', 0),
+                    'language': match.metadata.get('language', '')
+                },
+                'score': match.score
+            }
+            for match in results.matches
+        ]
+    def get_stats(self) -> Dict[str, Any]:
+        """Return index statistics, or a zero-count placeholder if they cannot be fetched."""
+        try:
+            stats = self.index.describe_index_stats()
+            return {
+                'total_chunks': stats.total_vector_count,
+                'index_name': self.config.PINECONE_INDEX_NAME,
+                'dimension': stats.dimension
+            }
+        except Exception:
+            # Best effort: callers (e.g. the health endpoint) still get a usable dict.
+            return {'total_chunks': 0, 'index_name': self.config.PINECONE_INDEX_NAME}
+    def clear_index(self):
+        """Delete all vectors from the index; failures are reported but not raised."""
+        try:
+            self.index.delete(delete_all=True)
+            print("⚠️  Index cleared!")
+        except Exception as exc:
+            print(f"⚠️  Failed to clear index: {exc}")
+# ============================================================================
+# LLM Specialists with Cost Tracking
+# ============================================================================
+class ArchitectLLM:
+    """LLM #1: Architect - planning and analysis.
+    Both public methods send a single user prompt, record token usage on the
+    module-level cost tracker and always return a dict: the parsed JSON object
+    when the reply is one, otherwise a default-shaped dict carrying the raw text.
+    """
+    # Opening Markdown fence, with or without a "json" tag (the tag is optional as a whole).
+    _FENCE_OPEN = re.compile(r'^```(?:json)?\s*', re.IGNORECASE)
+    _FENCE_CLOSE = re.compile(r'\s*```$')
+    def __init__(self, config: Config):
+        self.config = config
+        self._client = None
+        self.model = config.ARCHITECT_MODEL
+    @property
+    def client(self):
+        """Return the cached OpenAI client, creating it on first access.
+        Raises:
+            ValueError: if no OpenAI API key is configured.
+        """
+        if self._client is None:
+            if not self.config.OPENAI_API_KEY:
+                raise ValueError("OpenAI API key not set!")
+            self._client = OpenAI(api_key=self.config.OPENAI_API_KEY)
+        return self._client
+    def reset_client(self):
+        """Drop the cached client so the next access rebuilds it with the current key."""
+        self._client = None
+    def _complete(self, prompt: str) -> str:
+        """Send ``prompt`` as one user message, track its cost and return the reply text."""
+        response = self.client.chat.completions.create(
+            model=self.model,
+            messages=[{"role": "user", "content": prompt}],
+            temperature=0.3
+        )
+        usage = response.usage
+        cost_tracker.add_architect_call(usage.prompt_tokens, usage.completion_tokens)
+        # The message content can be None; normalise to an empty string.
+        return response.choices[0].message.content or ''
+    def _parse_json_object(self, content: str, fallback_key: str,
+                           defaults: Dict[str, Any]) -> Dict[str, Any]:
+        """Parse a (possibly fenced) JSON object from ``content``.
+        Returns the parsed dict. When the text is not valid JSON, or is valid
+        JSON but not an object, returns ``defaults`` plus ``fallback_key`` set
+        to the fence-stripped text so callers can still use ``.get``.
+        """
+        text = self._FENCE_OPEN.sub('', content.strip())
+        text = self._FENCE_CLOSE.sub('', text)
+        try:
+            parsed = json.loads(text)
+        except json.JSONDecodeError:
+            parsed = None
+        if isinstance(parsed, dict):
+            return parsed
+        return {fallback_key: text, **defaults}
+    def analyze_ticket(self, ticket: JiraTicket) -> Dict[str, Any]:
+        """Ask the model to analyse ``ticket`` and return the analysis dict.
+        Expected keys: summary, key_entities, technical_keywords, prerequisites,
+        complexity, complexity_reason, risks. On an unparseable reply the raw
+        text becomes 'summary' and the remaining keys take empty defaults.
+        """
+        prompt = f"""Analyze this Jira ticket for implementation:
+ID: {ticket.ticket_id}
+Title: {ticket.title}
+Description: {ticket.description}
+Acceptance Criteria: {ticket.acceptance_criteria or 'Not specified'}
+Provide JSON:
+{{
+    "summary": "2-3 sentence summary",
+    "key_entities": ["entity1", "entity2"],
+    "technical_keywords": ["keyword1", "keyword2"],
+    "prerequisites": ["prereq1"],
+    "complexity": "Low/Medium/High",
+    "complexity_reason": "why",
+    "risks": ["risk1"]
+}}"""
+        content = self._complete(prompt)
+        return self._parse_json_object(content, "summary", {
+            "key_entities": [], "technical_keywords": [],
+            "prerequisites": [], "complexity": "Unknown", "complexity_reason": "", "risks": []
+        })
+    def create_implementation_strategy(self, ticket_analysis: Dict, code_context: List[Dict]) -> Dict:
+        """Ask the model for an implementation strategy given the analysis and code context.
+        Only the first five context entries are used, each truncated to 500
+        characters. Expected keys: architecture_notes, implementation_steps,
+        files_to_modify, patterns_to_follow, integration_points. On an
+        unparseable reply the raw text becomes 'architecture_notes'.
+        """
+        context_str = "\n".join([
+            f"File: {c['metadata'].get('file_path', '?')}\n{c['content'][:500]}"
+            for c in code_context[:5]
+        ])
+        prompt = f"""Create a detailed implementation strategy for this ticket:
+Ticket Analysis: {json.dumps(ticket_analysis, indent=2)}
+Relevant Code Context:
+{context_str}
+Provide a comprehensive JSON response with:
+{{
+    "architecture_notes": "Detailed explanation of how this feature fits into the existing architecture",
+    "implementation_steps": ["Step 1: ...", "Step 2: ...", "Step 3: ..."],
+    "files_to_modify": [
+        {{
+            "path": "relative/path/to/file.py",
+            "action": "create|modify|extend",
+            "reason": "Why this file needs to be changed",
+            "details": "Specific changes needed (functions to add, classes to modify, etc.)"
+        }}
+    ],
+    "patterns_to_follow": ["Pattern 1 from codebase", "Pattern 2 from codebase"],
+    "integration_points": ["Where this integrates with existing code"]
+}}
+Be specific about file paths, actions, and implementation details."""
+        content = self._complete(prompt)
+        return self._parse_json_object(content, "architecture_notes", {
+            "implementation_steps": [],
+            "files_to_modify": [], "patterns_to_follow": [], "integration_points": []
+        })
+class DeveloperLLM:
+    """LLM #2: Developer - code generation and code explanation.
+    Every call sends a single user prompt and records its token usage on the
+    module-level cost tracker.
+    """
+    # Opening Markdown fence, with or without a "json" tag (the tag is optional as a whole).
+    _FENCE_OPEN = re.compile(r'^```(?:json)?\s*', re.IGNORECASE)
+    _FENCE_CLOSE = re.compile(r'\s*```$')
+    # Any fenced code block; group 1 is the block body.
+    _CODE_BLOCK = re.compile(r'```(?:\w+)?\n(.*?)```', re.DOTALL)
+    _TODO = re.compile(r'TODO:', re.IGNORECASE)
+    def __init__(self, config: Config):
+        self.config = config
+        self._client = None
+        self.model = config.DEVELOPER_MODEL
+    @property
+    def client(self):
+        """Return the cached OpenAI client, creating it on first access.
+        Raises:
+            ValueError: if no OpenAI API key is configured.
+        """
+        if self._client is None:
+            if not self.config.OPENAI_API_KEY:
+                raise ValueError("OpenAI API key not set!")
+            self._client = OpenAI(api_key=self.config.OPENAI_API_KEY)
+        return self._client
+    def reset_client(self):
+        """Drop the cached client so the next access rebuilds it with the current key."""
+        self._client = None
+    def _complete(self, prompt: str, **extra) -> str:
+        """Send ``prompt`` as one user message, track its cost and return the reply text.
+        ``extra`` is forwarded to the chat completion call (e.g. ``max_tokens``).
+        """
+        response = self.client.chat.completions.create(
+            model=self.model,
+            messages=[{"role": "user", "content": prompt}],
+            temperature=0.3,
+            **extra
+        )
+        usage = response.usage
+        cost_tracker.add_developer_call(usage.prompt_tokens, usage.completion_tokens)
+        # The message content can be None; normalise to an empty string.
+        return response.choices[0].message.content or ''
+    def _annotate_todos(self, code: str) -> str:
+        """Prefix a review note when more than half of the non-blank lines contain 'TODO:'."""
+        lines = code.split('\n')
+        todo_count = sum(1 for line in lines if self._TODO.search(line))
+        total_lines = sum(1 for line in lines if line.strip())
+        if total_lines > 0 and (todo_count / total_lines) > 0.5:
+            return f"# Note: This code contains many TODOs. Please review and implement.\n\n{code}"
+        return code
+    def generate_boilerplate(self, ticket_analysis: Dict, strategy: Dict, code_context: List[Dict]) -> Dict[str, str]:
+        """Generate implementation code for a ticket.
+        Args:
+            ticket_analysis: analysis dict; 'summary' and 'key_entities' are read.
+            strategy: strategy dict; 'implementation_steps', 'files_to_modify'
+                and 'patterns_to_follow' are read.
+            code_context: search results; the first five are quoted, 600 chars each.
+        Returns:
+            Mapping of file path to code. When the reply is not a JSON object,
+            a single 'generated_code.txt' entry holds the first fenced code
+            block of the reply, or the whole reply if it has none.
+        """
+        context_str = "\n".join([
+            f"// File: {c['metadata'].get('file_path', '?')}\n{c['content'][:600]}\n"
+            for c in code_context[:5]
+        ])
+        # Ignore entries that are not dicts; the list comes straight from model output.
+        files_to_modify = [f for f in (strategy.get('files_to_modify') or []) if isinstance(f, dict)]
+        files_info = "\n".join([
+            f"- {f.get('path', 'unknown')}: {f.get('action', 'create')} - {f.get('reason', '')}"
+            for f in files_to_modify[:10]
+        ]) if files_to_modify else "Create new files as needed"
+        patterns = strategy.get('patterns_to_follow', [])
+        patterns_str = "\n".join([f"- {p}" for p in patterns]) if patterns else "Follow existing codebase patterns"
+        steps_str = "\n".join(
+            f"{i+1}. {step}" for i, step in enumerate(strategy.get('implementation_steps', []))
+        )
+        # str() guards the join against non-string entities in model output.
+        entities_str = ', '.join(str(entity) for entity in ticket_analysis.get('key_entities', []))
+        prompt = f"""Generate complete, production-ready implementation code for this ticket.
+Ticket Summary: {ticket_analysis.get('summary', '')}
+Key Entities: {entities_str}
+Implementation Steps:
+{steps_str}
+Files to Create/Modify:
+{files_info}
+Patterns to Follow:
+{patterns_str}
+Existing Codebase Patterns (for reference):
+{context_str}
+IMPORTANT REQUIREMENTS:
+1. Generate COMPLETE, WORKING code - NOT placeholder TODOs or comments
+2. Follow the exact patterns, structure, and style from the existing codebase
+3. Include all necessary imports, error handling, and type hints
+4. Make the code production-ready and functional
+5. For new files, include complete class/function implementations
+6. For modifications, show the complete updated code sections
+7. Use the same coding conventions, naming, and architecture as the existing code
+Respond with JSON where keys are file paths and values are complete code:
+{{"path/to/file.py": "complete working code here", "path/to/other.js": "complete working code here"}}
+Generate actual implementation code, not TODO comments."""
+        # max_tokens leaves room for longer, more complete code generation
+        raw = self._complete(prompt, max_tokens=4000)
+        stripped = self._FENCE_CLOSE.sub('', self._FENCE_OPEN.sub('', raw.strip()))
+        try:
+            code_dict = json.loads(stripped)
+        except json.JSONDecodeError:
+            # Search the untouched reply: stripping the outer fence first would remove
+            # the closing marker this pattern needs in order to match.
+            code_blocks = self._CODE_BLOCK.findall(raw)
+            if code_blocks:
+                return {"generated_code.txt": code_blocks[0]}
+            return {"generated_code.txt": stripped}
+        if not isinstance(code_dict, dict):
+            print("Warning: Error processing generated code: reply was not a JSON object")
+            return {"generated_code.txt": stripped}
+        processed_code = {}
+        for file_path, code in code_dict.items():
+            if not isinstance(code, str):
+                # Keep the entry (and the other files) by rendering nested values as JSON text.
+                code = json.dumps(code, indent=2)
+            processed_code[file_path] = self._annotate_todos(code)
+        return processed_code
+    def explain_code_context(self, code_context: List[Dict], question: str) -> str:
+        """Answer ``question`` about the first five entries of ``code_context``."""
+        context_str = "\n".join([f"File: {c['metadata'].get('file_path', '?')}\n{c['content']}"
+                                  for c in code_context[:5]])
+        prompt = f"""Explain this code:
+{context_str}
+Question: {question}
+Be concise and helpful."""
+        return self._complete(prompt)
+# ============================================================================
+# Main Agent
+# ============================================================================
+class DevProductivityAgent:
+    """Main orchestrator: wires the indexer, the architect and the developer together."""
+    def __init__(self, config: Config = None):
+        self.config = config or Config()
+        self.indexer = CodebaseIndexer(self.config)
+        self.architect = ArchitectLLM(self.config)
+        self.developer = DeveloperLLM(self.config)
+    @staticmethod
+    def _as_str_list(value: Any) -> List[str]:
+        """Coerce a model-provided field into a list of non-blank, stripped strings."""
+        if isinstance(value, str):
+            value = [value]
+        if not isinstance(value, (list, tuple)):
+            return []
+        texts = (str(item).strip() for item in value if item is not None)
+        return [text for text in texts if text]
+    def set_api_keys(self, openai_key: str = None, pinecone_key: str = None):
+        """Store new API keys and drop cached clients so they are rebuilt with them."""
+        if openai_key:
+            self.config.OPENAI_API_KEY = openai_key
+            self.architect.reset_client()
+            self.developer.reset_client()
+            self.indexer._openai_client = None
+        if pinecone_key:
+            self.config.PINECONE_API_KEY = pinecone_key
+            self.indexer._index = None
+    def index_codebase(self, directory: str, extensions: List[str] = None) -> Dict:
+        """Index ``directory`` and return a summary.
+        Returns a dict with 'files_indexed' (files that produced a chunk count),
+        'total_chunks' (from the index statistics) and per-file 'details'.
+        """
+        print(f"📂 Indexing: {directory}")
+        results = self.indexer.index_directory(directory, extensions)
+        stats = self.indexer.get_stats()
+        return {
+            # Failed files are recorded as error strings, so only int entries count.
+            "files_indexed": len([r for r in results.values() if isinstance(r, int)]),
+            "total_chunks": stats['total_chunks'],
+            "details": results
+        }
+    def process_ticket(self, ticket: JiraTicket) -> ImplementationPlan:
+        """Run the full pipeline for one ticket: analyse, retrieve, plan, generate."""
+        print("📋 Analyzing...")
+        analysis = self.architect.analyze_ticket(ticket)
+        if not isinstance(analysis, dict):
+            analysis = {}
+        key_entities = self._as_str_list(analysis.get('key_entities'))
+        print("🔍 Searching...")
+        keywords = self._as_str_list(analysis.get('technical_keywords'))
+        # De-duplicate while keeping order so the five-query budget is not spent on repeats.
+        queries = list(dict.fromkeys(keywords + key_entities))
+        if not queries and ticket.title.strip():
+            # The analysis gave nothing to search for; fall back to the ticket title.
+            queries = [ticket.title.strip()]
+        all_results = []
+        seen = set()
+        for q in queries[:5]:
+            for r in self.indexer.search(q, top_k=5):
+                # Keep only the first hit per file.
+                fp = r['metadata'].get('file_path', '')
+                if fp not in seen:
+                    all_results.append(r)
+                    seen.add(fp)
+        print("📐 Planning...")
+        strategy = self.architect.create_implementation_strategy(analysis, all_results)
+        if not isinstance(strategy, dict):
+            strategy = {}
+        print("💻 Generating...")
+        code = self.developer.generate_boilerplate(analysis, strategy, all_results)
+        cost_tracker.record_ticket()
+        # Model output is coerced to the declared field types so a malformed reply
+        # does not fail response validation.
+        return ImplementationPlan(
+            ticket_summary=str(analysis.get('summary') or ''),
+            key_entities=key_entities,
+            relevant_files=[{
+                'path': r['metadata'].get('file_path', ''),
+                'relevance': f"Lines {r['metadata'].get('line_start', '?')}-{r['metadata'].get('line_end', '?')}",
+                'preview': r['content'][:200]
+            } for r in all_results[:10]],
+            implementation_steps=self._as_str_list(strategy.get('implementation_steps')),
+            prerequisites=self._as_str_list(analysis.get('prerequisites')),
+            boilerplate_code=code,
+            architecture_notes=str(strategy.get('architecture_notes') or ''),
+            estimated_complexity=str(analysis.get('complexity') or 'Unknown')
+        )
+    def ask_about_code(self, question: str) -> str:
+        """Answer ``question`` from the indexed code, or say so when nothing matches."""
+        results = self.indexer.search(question)
+        if not results:
+            return "No relevant code found. Index your codebase first."
+        answer = self.developer.explain_code_context(results, question)
+        cost_tracker.record_question()
+        return answer
+    def get_cost_stats(self) -> Dict:
+        """Return the cost tracker's statistics dict."""
+        return cost_tracker.get_stats()
+    def reset_cost_tracking(self):
+        """Reset the module-level cost tracker."""
+        cost_tracker.reset()
+# ============================================================================
+# FastAPI
+# ============================================================================
+# FastAPI application object that the route decorators below attach to.
+app = FastAPI(title="Developer Productivity Agent", version="2.0.0")
+# CORS is fully open: any origin, method and header, with credentials allowed.
+# NOTE(review): FastAPI's CORS documentation advises against combining wildcard origins
+# with allow_credentials=True — confirm whether credentials are needed and tighten one of them.
+app.add_middleware(CORSMiddleware, allow_origins=["*"], allow_credentials=True,
+                   allow_methods=["*"], allow_headers=["*"])
+# Single agent shared by every route and by the CLI entry point; built with the default Config.
+agent = DevProductivityAgent()
+@app.get("/")
+async def root():
+    # Health check: reports the chunk count from the indexer's statistics.
+    chunk_total = agent.indexer.get_stats()['total_chunks']
+    return {"status": "healthy", "vector_db": "Pinecone", "chunks": chunk_total}
+@app.get("/stats")
+async def get_stats():
+    # Pass the indexer's statistics dict straight through to the client.
+    index_stats = agent.indexer.get_stats()
+    return index_stats
+@app.get("/cost-analytics")
+async def get_cost_analytics():
+    """Get cost analytics and savings"""
+    # The payload is the cost tracker's statistics dict, unchanged.
+    analytics = agent.get_cost_stats()
+    return analytics
+@app.post("/reset-costs")
+async def reset_costs():
+    # Clears every counter on the shared cost tracker, then acknowledges.
+    agent.reset_cost_tracking()
+    acknowledgement = {"status": "reset"}
+    return acknowledgement
+@app.post("/index")
+async def index_codebase(directory: str, extensions: List[str] = None):
+    # Index a server-side directory; any failure is reported as HTTP 500 with the error text.
+    try:
+        summary = agent.index_codebase(directory, extensions)
+    except Exception as exc:
+        raise HTTPException(status_code=500, detail=str(exc))
+    return {"status": "success", "results": summary}
+@app.post("/process-ticket", response_model=ImplementationPlan)
+async def process_ticket(ticket: JiraTicket):
+    # Run the full ticket pipeline; any failure is reported as HTTP 500 with the error text.
+    try:
+        plan = agent.process_ticket(ticket)
+    except Exception as exc:
+        raise HTTPException(status_code=500, detail=str(exc))
+    return plan
+@app.post("/ask")
+async def ask(question: str):
+    # Answer a question about the indexed code; failures become HTTP 500 with the error text.
+    try:
+        reply = agent.ask_about_code(question)
+    except Exception as exc:
+        raise HTTPException(status_code=500, detail=str(exc))
+    return {"answer": reply}
+@app.post("/search")
+async def search(query: str, top_k: int = 10):
+    # Raw vector search over the index; failures become HTTP 500 with the error text.
+    try:
+        matches = agent.indexer.search(query, top_k)
+    except Exception as exc:
+        raise HTTPException(status_code=500, detail=str(exc))
+    return {"results": matches}
+@app.delete("/clear")
+async def clear():
+    # Ask the indexer to delete every vector, then acknowledge.
+    agent.indexer.clear_index()
+    acknowledgement = {"status": "cleared"}
+    return acknowledgement
+if __name__ == "__main__":
+    # Command-line entry point: optionally index a directory, then optionally serve the API.
+    import argparse
+    parser = argparse.ArgumentParser(description="Developer Productivity Agent")
+    parser.add_argument("--index", type=str, help="directory to index before exiting or serving")
+    parser.add_argument("--serve", action="store_true", help="start the HTTP API")
+    parser.add_argument("--port", type=int, default=8000, help="port for --serve (default: 8000)")
+    args = parser.parse_args()
+    if not (args.index or args.serve):
+        # Nothing was requested; show usage instead of exiting silently.
+        parser.print_help()
+    if args.index:
+        summary = agent.index_codebase(args.index)
+        # Per-file failures are stored as error strings in the details; surface them here.
+        failures = {path: outcome for path, outcome in summary["details"].items()
+                    if not isinstance(outcome, int)}
+        print(f"Indexed {summary['files_indexed']} files, {summary['total_chunks']} chunks in index")
+        for path, outcome in failures.items():
+            print(f"  ❌ {path}: {outcome}")
+    if args.serve:
+        uvicorn.run(app, host="0.0.0.0", port=args.port)