shiva9876 commited on
Commit
59da258
·
verified ·
1 Parent(s): 8c06638

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +337 -0
app.py ADDED
@@ -0,0 +1,337 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import os
import time
import uuid
import requests
import re
from fastapi import FastAPI, HTTPException, Request
from pydantic import BaseModel, Field
from fastapi.middleware.cors import CORSMiddleware
from functools import lru_cache
from typing import Optional, Dict, Any, List
from dotenv import load_dotenv

# Load .env automatically from the project directory
load_dotenv()

# Read API key from environment
GROQ_API_KEY = os.getenv("GROQ_API_KEY")

# Hardcoded configuration
GROQ_MODEL = "moonshotai/kimi-k2-instruct-0905"  # Default Groq model
MAX_TOKENS = 2000   # Upper bound on tokens the model may generate per reply
TEMPERATURE = 0.5   # Sampling temperature (0 = deterministic, higher = more varied)

# Debugging: report at startup whether the API key was found.
if not GROQ_API_KEY:
    print("❌ GROQ_API_KEY is not set. Check your .env file or environment variables.")
else:
    print(f"✅ GROQ_API_KEY Loaded: {GROQ_API_KEY[:10]}******")  # Masked for security

print(f"📦 GROQ_MODEL Loaded: {GROQ_MODEL}")
print(f"⚙️ Using parameters: MAX_TOKENS={MAX_TOKENS}, TEMPERATURE={TEMPERATURE}")

# Initialize FastAPI app
app = FastAPI(
    title="Code Generation API with Groq",
    description="API for generating code and explanations using Groq's LLM models",
    version="1.0.0"
)

# Enable CORS for frontend communication
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],  # Update this with frontend domain in production
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)

# In-memory conversation history keyed by session_id.
# Values are OpenAI-format message dicts ({"role": ..., "content": ...}).
# Process-local only — use Redis/DB for production.
conversation_history: Dict[str, List[Dict[str, str]]] = {}
51
+
52
+
53
+ # Define request formats
54
class PromptRequest(BaseModel):
    """Request body for /generate/: a user prompt plus optional session and format hints."""

    prompt: str = Field(..., description="The user's prompt or question")
    session_id: Optional[str] = Field(None, description="Session ID for conversation history")
    response_type: Optional[str] = Field("both", description="Type of response: 'code', 'explanation', or 'both'")
58
+
59
+
60
class HistoryRequest(BaseModel):
    """Request body for the history endpoints: identifies the session to read or clear."""

    session_id: str = Field(..., description="Session ID to retrieve or clear history")
62
+
63
+
64
def classify_message(message: str) -> str:
    """Classify whether the message is conversational or code-related.

    Conversational phrases are matched on whole-word boundaries. The previous
    implementation used raw substring / prefix checks, so "hi" matched inside
    "this" (e.g. "fix this script" was classified as conversation) and
    startswith("no") matched "node.js ...".

    Args:
        message: Raw user input.

    Returns:
        "conversation" for greetings, small talk, and short questions;
        "code" for programming-related requests.
    """
    message_lower = message.lower().strip()

    # List of common conversational greetings and phrases
    conversational_phrases = [
        "hi", "hello", "hey", "hi there", "hello there", "hey there",
        "how are you", "good morning", "good afternoon", "good evening",
        "what's up", "how's it going", "nice to meet you", "bye", "goodbye",
        "thank you", "thanks", "ok", "okay", "yes", "no", "maybe",
        "help", "who are you", "what can you do", "what are you",
        "tell me about yourself"
    ]

    def _starts_with_phrase(phrase: str) -> bool:
        # Whole-word prefix: "hi there" matches, "history of java" does not.
        return re.match(re.escape(phrase) + r"\b", message_lower) is not None

    def _contains_phrase(phrase: str) -> bool:
        # Whole-word containment anywhere in the message.
        return re.search(r"\b" + re.escape(phrase) + r"\b", message_lower) is not None

    # Greetings, common phrases (first 10 entries), or short questions.
    if any(_starts_with_phrase(phrase) for phrase in conversational_phrases) or \
       any(_contains_phrase(phrase) for phrase in conversational_phrases[:10]) or \
       (message_lower.endswith("?") and len(message_lower.split()) <= 8):
        return "conversation"

    # Check for code-related keywords. Substring matching is kept here
    # deliberately: "c++" has no word boundary after the trailing "+".
    code_keywords = ["code", "function", "script", "program", "algorithm", "implement",
                     "write", "create", "python", "javascript", "java", "c++"]

    if any(keyword in message_lower for keyword in code_keywords):
        return "code"

    # If in doubt, treat as conversation
    return "conversation"
95
+
96
+
97
+ # API call function with retry and improved error handling
98
# API call function with retry and improved error handling
def generate_response_groq(messages: List[Dict[str, str]]) -> str:
    """Send a chat-completion request to the Groq API and return the reply text.

    Retries up to 3 times (with exponential backoff) on rate limiting (429),
    service unavailability (503), timeouts, and connection errors.
    Authentication failures (401) are raised immediately without retrying.

    Args:
        messages: Chat messages in OpenAI format ({"role": ..., "content": ...}).

    Returns:
        The generated assistant message content, or "No response generated"
        when the API returns an empty choices list.

    Raises:
        HTTPException: 500 if the API key is missing or all attempts fail,
            401 on invalid credentials, 504 on timeout, 503 on connection
            failure, or the upstream status code for other API errors.
    """
    if not GROQ_API_KEY:
        raise HTTPException(status_code=500, detail="GROQ_API_KEY is missing.")

    url = "https://api.groq.com/openai/v1/chat/completions"
    headers = {
        "Authorization": f"Bearer {GROQ_API_KEY}",
        "Content-Type": "application/json"
    }
    payload = {
        "model": GROQ_MODEL,
        "messages": messages,
        "temperature": TEMPERATURE,
        "max_tokens": MAX_TOKENS,
    }

    for attempt in range(3):  # Retry logic
        try:
            print(f"🔄 Attempt {attempt + 1} - Sending request to Groq API")
            response = requests.post(url, headers=headers, json=payload, timeout=60)
            print(f"📊 Status Code: {response.status_code}")

            if response.status_code == 200:
                result = response.json()
                if "choices" in result and len(result["choices"]) > 0:
                    generated_text = result["choices"][0]["message"]["content"]
                    return generated_text
                return "No response generated"

            elif response.status_code == 401:  # Unauthorized (Invalid API key)
                print("❌ Authentication error: Invalid API Key")
                raise HTTPException(status_code=401, detail="Invalid API Key. Check your GROQ_API_KEY.")

            elif response.status_code == 429:  # Rate limit error
                print("⚠️ Rate limited, retrying...")
                time.sleep(2 ** attempt)  # Exponential backoff
                continue

            elif response.status_code == 503:  # Service unavailable
                print("⚠️ Service unavailable, retrying...")
                time.sleep(2 ** attempt)
                continue

            else:
                error_detail = "Unknown error"
                try:
                    error_data = response.json()
                    error_detail = error_data.get("error", {}).get("message", str(error_data))
                except ValueError:  # response body was not valid JSON
                    error_detail = response.text

                print(f"❌ API Error: {error_detail}")
                if attempt == 2:  # Last attempt
                    raise HTTPException(status_code=response.status_code,
                                        detail=f"Groq API Error: {error_detail}")

        # BUGFIX: the HTTPExceptions raised above (the immediate 401 and the
        # last-attempt API error) were previously swallowed by the broad
        # `except Exception` below and converted into retries + a generic 500.
        # Re-raise them untouched so their status codes reach the caller.
        except HTTPException:
            raise

        except requests.exceptions.Timeout:
            print("⚠️ Request timed out, retrying...")
            if attempt == 2:  # Last attempt
                raise HTTPException(status_code=504, detail="Request timed out")

        except requests.exceptions.ConnectionError:
            print("⚠️ Connection error, retrying...")
            if attempt == 2:  # Last attempt
                raise HTTPException(status_code=503, detail="Could not connect to Groq API")

        except Exception as e:
            print(f"❌ Unexpected error: {str(e)}")
            if attempt == 2:  # Last attempt
                raise HTTPException(status_code=500, detail=f"Unexpected error: {str(e)}")

        # Wait before retry (except on last attempt)
        if attempt < 2:
            time.sleep(2 ** attempt)

    raise HTTPException(status_code=500, detail="Failed to get response after multiple attempts")
175
+
176
+
177
+ # Helper function to process and format the model's response
178
# Helper function to process and format the model's response
def process_response(raw_response: str, response_type: str) -> Dict[str, Any]:
    """Shape the raw model output according to the requested response type.

    Args:
        raw_response: Full text returned by the model.
        response_type: "conversation", "code", "explanation", or anything
            else (treated as "both").

    Returns:
        A dict with "response", "generated_code", and/or "explanation" keys
        depending on the requested type.
    """
    # One pattern for both extracting and stripping fenced code blocks.
    # Any language tag (or none) on the opening fence is accepted — the old
    # extraction pattern listed only a few languages, so fences like ```go
    # were stripped from explanations but never extracted as code.
    fence = re.compile(r"```[^\n]*\n(.*?)\n```", re.DOTALL)

    # For conversational responses, don't try to extract code
    if response_type == "conversation":
        return {"response": raw_response}

    elif response_type == "code":
        code_match = fence.search(raw_response)
        if code_match:
            return {"generated_code": code_match.group(1).strip()}
        # If no code block found, return the whole response as code
        return {"generated_code": raw_response}

    elif response_type == "explanation":
        # Remove code blocks, keeping only prose
        explanation = fence.sub("", raw_response).strip()
        return {"explanation": explanation}

    else:  # "both"
        code = None
        explanation = raw_response

        # Extract the first code block and strip all blocks from the prose
        code_match = fence.search(raw_response)
        if code_match:
            code = code_match.group(1).strip()
            explanation = fence.sub("", raw_response).strip()

        return {
            "response": raw_response,
            "generated_code": code,
            "explanation": explanation
        }
214
+
215
+
216
+ # API route for generating responses
217
# API route for generating responses
@app.post("/generate/")
async def generate_response(request: PromptRequest):
    """Handle a user prompt: maintain session history, call Groq, shape output.

    Creates a new session ID when the client does not supply one. The reply is
    returned raw for conversational prompts; code-related prompts are
    post-processed according to request.response_type.
    """
    try:
        # Reuse the caller's session or start a fresh one.
        session_id = request.session_id or str(uuid.uuid4())

        if session_id not in conversation_history:
            conversation_history[session_id] = []

        # Classify the message type first
        message_type = classify_message(request.prompt)

        # Build messages array for Groq API (OpenAI format)
        messages = []

        # Pick a system prompt: a conversational persona, or one of three
        # code-oriented personas based on the requested response type.
        if message_type == "conversation":
            system_prompt = "You are a helpful and friendly AI assistant. Engage in natural conversation and answer questions clearly."
        else:
            if request.response_type == "code":
                system_prompt = "You are an expert programmer. Provide clean, efficient code solutions. Always wrap code in markdown code blocks with the appropriate language tag."
            elif request.response_type == "explanation":
                system_prompt = "You are a programming tutor. Explain programming concepts clearly without providing code. Focus on the approach and logic."
            else:  # both
                system_prompt = "You are an expert programmer and teacher. Provide clear explanations followed by well-commented code examples. Always wrap code in markdown code blocks."

        messages.append({"role": "system", "content": system_prompt})

        # Add conversation history (last 6 messages to keep context manageable)
        if conversation_history[session_id]:
            for msg in conversation_history[session_id][-6:]:
                messages.append(msg)

        # Add current user message
        messages.append({"role": "user", "content": request.prompt})

        # Get response from Groq model
        print(f"📤 Sending {len(messages)} messages to Groq...")
        generated_response = generate_response_groq(messages)
        print(f"✅ Received response of length: {len(generated_response)}")

        # Store conversation history in OpenAI message format
        conversation_history[session_id].append({"role": "user", "content": request.prompt})
        conversation_history[session_id].append({"role": "assistant", "content": generated_response})

        # Limit history size to prevent memory issues (keep last 20 messages = 10 exchanges)
        if len(conversation_history[session_id]) > 20:
            conversation_history[session_id] = conversation_history[session_id][-20:]

        # For conversational messages, return directly without code/explanation processing
        if message_type == "conversation":
            response_data = {
                "response": generated_response,
                "message_type": "conversation"
            }
        else:
            # Handle response type and build response data for code-related messages
            response_data = process_response(generated_response, request.response_type)
            response_data["message_type"] = "code"

        response_data["session_id"] = session_id
        return response_data

    except HTTPException:
        # Re-raise HTTP exceptions untouched to preserve their status codes
        # (the original bound the exception to an unused variable).
        raise
    except Exception as e:
        print(f"❌ Unexpected error in generate_response: {str(e)}")
        raise HTTPException(status_code=500, detail=f"Unexpected error: {str(e)}")
286
+
287
+
288
+ # API route for clearing conversation history
289
# API route for clearing conversation history
@app.post("/clear_history/")
async def clear_history(request: HistoryRequest):
    """Reset the stored conversation for the supplied session, if it exists."""
    if request.session_id not in conversation_history:
        return {"status": "not_found", "message": "Session ID not found"}
    conversation_history[request.session_id] = []
    return {"status": "success", "message": "Conversation history cleared"}
296
+
297
+
298
+ # API route for getting conversation history
299
# API route for getting conversation history
@app.post("/get_history/")
async def get_history(request: HistoryRequest):
    """Return the stored message list for a session, or a not_found status."""
    stored = conversation_history.get(request.session_id)
    if stored is None:
        return {"status": "not_found", "message": "Session ID not found"}
    return {"status": "success", "history": stored}
308
+
309
+
310
+ # Health check endpoint
311
# Health check endpoint
@app.get("/")
@app.get("/health")
async def health_check():
    """Report service liveness plus the configured model and API version."""
    status_payload = {
        "status": "ok",
        "service": "Groq Code Generation API",
        "model": GROQ_MODEL,
        "version": "1.0.0",
    }
    return status_payload
321
+
322
+
323
+ # Request logging middleware for debugging
324
# Request logging middleware for debugging
@app.middleware("http")
async def log_requests(request: Request, call_next):
    """Print one line per request: method, path, status, and elapsed seconds."""
    started = time.time()
    response = await call_next(request)
    elapsed = time.time() - started
    print(f"📝 {request.method} {request.url.path} → Status: {response.status_code} ({elapsed:.2f}s)")
    return response
332
+
333
+
334
if __name__ == "__main__":
    import uvicorn

    # Hugging Face Spaces serves apps on port 7860 by default.
    listen_port = int(os.getenv("PORT", "7860"))
    uvicorn.run(app, host="0.0.0.0", port=listen_port)