# NOTE(review): the lines "Spaces:" / "Sleeping" that appeared here were
# Hugging Face Spaces page chrome captured during extraction, not source code.
| import os | |
| import time | |
| import uuid | |
| import requests | |
| import re | |
| from fastapi import FastAPI, HTTPException, Request | |
| from pydantic import BaseModel, Field | |
| from fastapi.middleware.cors import CORSMiddleware | |
| from functools import lru_cache | |
| from typing import Optional, Dict, Any, List | |
| from dotenv import load_dotenv | |
# Load .env automatically from the project directory
load_dotenv()

# Read API key from environment; never hardcode secrets in source.
GROQ_API_KEY = os.getenv("GROQ_API_KEY")

# Hardcoded generation configuration
GROQ_MODEL = "moonshotai/kimi-k2-instruct-0905"  # Default Groq model
MAX_TOKENS = 2000    # Upper bound on completion length
TEMPERATURE = 0.5    # Moderate sampling randomness

# Startup diagnostics: confirm the key and config were picked up.
# NOTE(review): the status-prefix characters in these strings look like
# mojibake (emoji mangled during extraction) — confirm against the original.
if not GROQ_API_KEY:
    print("β GROQ_API_KEY is not set. Check your .env file or environment variables.")
else:
    print(f"β GROQ_API_KEY Loaded: {GROQ_API_KEY[:10]}******")  # Masked for security
    print(f"π¦ GROQ_MODEL Loaded: {GROQ_MODEL}")
    print(f"βοΈ Using parameters: MAX_TOKENS={MAX_TOKENS}, TEMPERATURE={TEMPERATURE}")
# Initialize FastAPI app
app = FastAPI(
    title="Code Generation API with Groq",
    description="API for generating code and explanations using Groq's LLM models",
    version="1.0.0"
)

# Enable CORS for frontend communication
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],  # Update this with frontend domain in production
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)

# In-memory conversation history keyed by session_id; each value is a list of
# OpenAI-format {"role": ..., "content": ...} dicts. Lost on restart —
# use Redis/DB for production.
conversation_history: Dict[str, List[Dict[str, str]]] = {}
| # Define request formats | |
class PromptRequest(BaseModel):
    """Request body for the generation endpoint."""
    prompt: str = Field(..., description="The user's prompt or question")
    session_id: Optional[str] = Field(None, description="Session ID for conversation history")
    response_type: Optional[str] = Field("both", description="Type of response: 'code', 'explanation', or 'both'")
class HistoryRequest(BaseModel):
    """Request body for the history retrieval/clearing endpoints."""
    session_id: str = Field(..., description="Session ID to retrieve or clear history")
def classify_message(message: str) -> str:
    """Classify *message* as "conversation" (small talk) or "code".

    Conversational phrases and short trailing-"?" questions win first;
    otherwise code keywords flip the result to "code"; anything ambiguous
    defaults to "conversation".
    """
    message_lower = message.lower().strip()

    # Common conversational greetings and phrases.
    conversational_phrases = [
        "hi", "hello", "hey", "hi there", "hello there", "hey there",
        "how are you", "good morning", "good afternoon", "good evening",
        "what's up", "how's it going", "nice to meet you", "bye", "goodbye",
        "thank you", "thanks", "ok", "okay", "yes", "no", "maybe",
        "help", "who are you", "what can you do", "what are you",
        "tell me about yourself"
    ]

    # BUG FIX: the old checks used str.startswith and plain substring
    # containment, so "highlight this algorithm" matched the greeting "hi"
    # and "this" contained "hi", misclassifying code requests as chat.
    # Match phrases on word boundaries instead.
    def _prefix(phrase: str) -> bool:
        # Phrase at the start of the message, not glued to a longer word.
        return re.match(re.escape(phrase) + r"(?!\w)", message_lower) is not None

    def _contains(phrase: str) -> bool:
        # Phrase anywhere in the message, bounded by non-word characters.
        return re.search(r"(?<!\w)" + re.escape(phrase) + r"(?!\w)", message_lower) is not None

    # Greeting prefix, greeting anywhere (first 10 phrases only, as before),
    # or a short question => conversation.
    if any(_prefix(p) for p in conversational_phrases) or \
       any(_contains(p) for p in conversational_phrases[:10]) or \
       (message_lower.endswith("?") and len(message_lower.split()) <= 8):
        return "conversation"

    # Code-related keywords push the message down the "code" path.
    code_keywords = ["code", "function", "script", "program", "algorithm", "implement",
                     "write", "create", "python", "javascript", "java", "c++"]
    if any(keyword in message_lower for keyword in code_keywords):
        return "code"

    # If in doubt, treat as conversation.
    return "conversation"
| # API call function with retry and improved error handling | |
def generate_response_groq(messages: List[Dict[str, str]]) -> str:
    """Send an OpenAI-format message list to Groq's chat-completions API.

    Retries up to 3 times with exponential backoff on rate limiting (429),
    service unavailability (503), timeouts and connection errors.

    Args:
        messages: list of {"role": ..., "content": ...} dicts.

    Returns:
        The assistant's generated text, or "No response generated" when the
        API returns no choices.

    Raises:
        HTTPException: 500 when the key is missing, 401 for a bad key, the
        upstream status for other API errors, 504 on timeout, 503 when the
        service is unreachable.
    """
    if not GROQ_API_KEY:
        raise HTTPException(status_code=500, detail="GROQ_API_KEY is missing.")
    url = "https://api.groq.com/openai/v1/chat/completions"
    headers = {
        "Authorization": f"Bearer {GROQ_API_KEY}",
        "Content-Type": "application/json"
    }
    payload = {
        "model": GROQ_MODEL,
        "messages": messages,
        "temperature": TEMPERATURE,
        "max_tokens": MAX_TOKENS,
    }
    for attempt in range(3):  # Retry logic
        try:
            print(f"π Attempt {attempt + 1} - Sending request to Groq API")
            response = requests.post(url, headers=headers, json=payload, timeout=60)
            print(f"π Status Code: {response.status_code}")
            if response.status_code == 200:
                result = response.json()
                if "choices" in result and len(result["choices"]) > 0:
                    return result["choices"][0]["message"]["content"]
                return "No response generated"
            elif response.status_code == 401:  # Unauthorized (invalid API key)
                print("β Authentication error: Invalid API Key")
                raise HTTPException(status_code=401, detail="Invalid API Key. Check your GROQ_API_KEY.")
            elif response.status_code == 429:  # Rate limit error
                print("β οΈ Rate limited, retrying...")
                time.sleep(2 ** attempt)  # Exponential backoff
                continue
            elif response.status_code == 503:  # Service unavailable
                print("β οΈ Service unavailable, retrying...")
                time.sleep(2 ** attempt)
                continue
            else:
                # Pull a human-readable error message out of the body if possible.
                error_detail = "Unknown error"
                try:
                    error_data = response.json()
                    error_detail = error_data.get("error", {}).get("message", str(error_data))
                except ValueError:  # was a bare except; JSON decode errors are ValueErrors
                    error_detail = response.text
                print(f"β API Error: {error_detail}")
                if attempt == 2:  # Last attempt
                    raise HTTPException(status_code=response.status_code,
                                        detail=f"Groq API Error: {error_detail}")
        except HTTPException:
            # BUG FIX: HTTPException subclasses Exception, so the generic
            # handler below used to swallow the deliberate 401 and
            # last-attempt raises above — retrying them or re-wrapping them
            # as 500s. Propagate them unchanged instead.
            raise
        except requests.exceptions.Timeout:
            print("β οΈ Request timed out, retrying...")
            if attempt == 2:  # Last attempt
                raise HTTPException(status_code=504, detail="Request timed out")
        except requests.exceptions.ConnectionError:
            print("β οΈ Connection error, retrying...")
            if attempt == 2:  # Last attempt
                raise HTTPException(status_code=503, detail="Could not connect to Groq API")
        except Exception as e:
            print(f"β Unexpected error: {str(e)}")
            if attempt == 2:  # Last attempt
                raise HTTPException(status_code=500, detail=f"Unexpected error: {str(e)}")
        # Wait before retry (except on last attempt)
        if attempt < 2:
            time.sleep(2 ** attempt)
    raise HTTPException(status_code=500, detail="Failed to get response after multiple attempts")
| # Helper function to process and format the model's response | |
def process_response(raw_response: str, response_type: str) -> Dict[str, Any]:
    """Shape the raw model text into the payload the API returns.

    Depending on *response_type*, the result carries the untouched response
    ("conversation"), the first fenced code block ("code"), the prose with
    code fences removed ("explanation"), or all three (default, "both").
    """
    # Shared patterns: one extracts the first fenced block's contents,
    # the other deletes every fenced block.
    fence_pattern = r"```(?:python|javascript|java|cpp|c\+\+)?\n(.*?)\n```"
    strip_pattern = r"```(?:\w+)?\n.*?\n```"

    if response_type == "conversation":
        # Conversational replies pass through untouched.
        return {"response": raw_response}

    if response_type == "code":
        match = re.search(fence_pattern, raw_response, re.DOTALL)
        # No fenced block: treat the entire reply as code.
        code = match.group(1).strip() if match else raw_response
        return {"generated_code": code}

    if response_type == "explanation":
        prose = re.sub(strip_pattern, "", raw_response, flags=re.DOTALL).strip()
        return {"explanation": prose}

    # Default ("both"): raw text plus extracted code and code-free prose.
    match = re.search(fence_pattern, raw_response, re.DOTALL)
    code = None
    prose = raw_response
    if match:
        code = match.group(1).strip()
        prose = re.sub(strip_pattern, "", raw_response, flags=re.DOTALL).strip()
    return {
        "response": raw_response,
        "generated_code": code,
        "explanation": prose
    }
| # API route for generating responses | |
# NOTE(review): the route decorator appears to have been lost in extraction —
# without one this handler is never registered on the app. Confirm the exact
# path the frontend calls before deploying.
@app.post("/generate")
async def generate_response(request: PromptRequest):
    """Handle a user prompt: classify it, query Groq, and track session history.

    Returns a dict whose keys depend on classification: conversational
    replies carry {"response", "message_type"}; code-related replies carry
    whatever process_response() builds plus "message_type". A "session_id"
    key is always included so the client can continue the conversation.

    Raises:
        HTTPException: propagated from generate_response_groq, or 500 on
        any other failure.
    """
    try:
        # Reuse the caller's session or mint a fresh one.
        session_id = request.session_id or str(uuid.uuid4())
        if session_id not in conversation_history:
            conversation_history[session_id] = []

        # Decide up front whether this is small talk or a coding request.
        message_type = classify_message(request.prompt)

        # Build the OpenAI-format message array for the Groq API,
        # starting with a system prompt matched to the request.
        messages = []
        if message_type == "conversation":
            system_prompt = "You are a helpful and friendly AI assistant. Engage in natural conversation and answer questions clearly."
        else:
            if request.response_type == "code":
                system_prompt = "You are an expert programmer. Provide clean, efficient code solutions. Always wrap code in markdown code blocks with the appropriate language tag."
            elif request.response_type == "explanation":
                system_prompt = "You are a programming tutor. Explain programming concepts clearly without providing code. Focus on the approach and logic."
            else:  # both
                system_prompt = "You are an expert programmer and teacher. Provide clear explanations followed by well-commented code examples. Always wrap code in markdown code blocks."
        messages.append({"role": "system", "content": system_prompt})

        # Include the last 6 stored messages to keep context manageable.
        messages.extend(conversation_history[session_id][-6:])

        # Current user turn goes last.
        messages.append({"role": "user", "content": request.prompt})

        print(f"π€ Sending {len(messages)} messages to Groq...")
        generated_response = generate_response_groq(messages)
        print(f"β Received response of length: {len(generated_response)}")

        # Persist the exchange in OpenAI message format.
        conversation_history[session_id].append({"role": "user", "content": request.prompt})
        conversation_history[session_id].append({"role": "assistant", "content": generated_response})

        # Cap history at 20 messages (10 exchanges) to bound memory use.
        if len(conversation_history[session_id]) > 20:
            conversation_history[session_id] = conversation_history[session_id][-20:]

        if message_type == "conversation":
            # Small talk: return the raw reply without code extraction.
            response_data = {
                "response": generated_response,
                "message_type": "conversation"
            }
        else:
            # Code-related: split into code/explanation per the requested type.
            response_data = process_response(generated_response, request.response_type)
            response_data["message_type"] = "code"

        response_data["session_id"] = session_id
        return response_data
    except HTTPException:
        # Re-raise HTTP exceptions to preserve their status codes
        # (dropped the unused "as e" binding).
        raise
    except Exception as e:
        print(f"β Unexpected error in generate_response: {str(e)}")
        raise HTTPException(status_code=500, detail=f"Unexpected error: {str(e)}")
| # API route for clearing conversation history | |
# NOTE(review): route decorator appears lost in extraction — without it this
# handler is never registered. Confirm the path the frontend calls.
@app.post("/clear_history")
async def clear_history(request: HistoryRequest):
    """Clear the stored conversation history for one session.

    Returns a status dict; "not_found" when the session_id is unknown.
    """
    if request.session_id in conversation_history:
        conversation_history[request.session_id] = []
        return {"status": "success", "message": "Conversation history cleared"}
    return {"status": "not_found", "message": "Session ID not found"}
| # API route for getting conversation history | |
# NOTE(review): route decorator appears lost in extraction — without it this
# handler is never registered. Confirm the path the frontend calls.
@app.post("/get_history")
async def get_history(request: HistoryRequest):
    """Return the stored conversation history for one session.

    Returns a status dict with the message list; "not_found" when the
    session_id is unknown.
    """
    if request.session_id in conversation_history:
        return {
            "status": "success",
            "history": conversation_history[request.session_id]
        }
    return {"status": "not_found", "message": "Session ID not found"}
| # Health check endpoint | |
# NOTE(review): route decorator appears lost in extraction — without it this
# endpoint is unreachable. Confirm the path (and GET method) before deploying.
@app.get("/health")
async def health_check():
    """Report service liveness plus the configured model and version."""
    return {
        "status": "ok",
        "service": "Groq Code Generation API",
        "model": GROQ_MODEL,
        "version": "1.0.0"
    }
| # Request logging middleware for debugging | |
# NOTE(review): the middleware decorator appears lost in extraction — without
# it this hook never runs. Confirm against the original file.
@app.middleware("http")
async def log_requests(request: Request, call_next):
    """Log method, path, status code and wall-clock latency for every request."""
    start_time = time.time()
    response = await call_next(request)
    process_time = time.time() - start_time
    print(f"π {request.method} {request.url.path} β Status: {response.status_code} ({process_time:.2f}s)")
    return response
if __name__ == "__main__":
    import uvicorn
    port = int(os.getenv("PORT", "7860"))  # Hugging Face Spaces uses port 7860
    # Bind to all interfaces so the container's port mapping works.
    uvicorn.run(app, host="0.0.0.0", port=port)