Spaces:

philipk22
/

fastapi-rag-react

Sleeping

App Files Files Community

fastapi-rag-react / backend /main.py

philipk22

change Dockerfile

9871eb4 about 1 year ago

raw

history blame contribute delete

4.95 kB

	from fastapi import FastAPI, UploadFile, File, HTTPException
	from fastapi.middleware.cors import CORSMiddleware
	from fastapi.responses import JSONResponse
	from fastapi.staticfiles import StaticFiles
	from pydantic import BaseModel
	from typing import List
	import os
	from dotenv import load_dotenv
	import tempfile
	import logging

	# Logging: configure the root logger at INFO, then create the logger the
	# request handlers in this module write to.
	logging.basicConfig(level=logging.INFO)
	logger = logging.getLogger(name=__name__)

	# Update imports to use relative paths
	from .text_utils import CharacterTextSplitter, TextFileLoader, PDFLoader
	from .openai_utils import SystemRolePrompt, UserRolePrompt, ChatOpenAI
	from .vector_store import VectorDatabase

	# Load variables from a .env file (if present) before the application and
	# its components are constructed.
	load_dotenv()

	app = FastAPI()

	# Browser origins allowed to call this API cross-origin: the local
	# development servers on ports 8000 and 3000, addressed both by hostname
	# and by loopback IP.
	_CORS_ALLOWED_ORIGINS = [
	    "http://localhost:8000",
	    "http://localhost:3000",
	    "http://127.0.0.1:8000",
	    "http://127.0.0.1:3000",
	]

	# Credentials are allowed, and any method or header is accepted from the
	# origins listed above.
	app.add_middleware(
	    CORSMiddleware,
	    allow_origins=_CORS_ALLOWED_ORIGINS,
	    allow_credentials=True,
	    allow_methods=["*"],
	    allow_headers=["*"],
	)

	# Prompt templates
	# System message: instructs the model to answer from the supplied context
	# and to say it does not know when the context lacks the answer.
	system_template = """\
	Use the following context to answer a users question. If you cannot find the answer in the context, say you don't know the answer."""
	system_role_prompt = SystemRolePrompt(system_template)

	# User message: carries {context} and {question} placeholders, which the
	# /query handler fills via create_message(question=..., context=...).
	user_prompt_template = """\
	Context:
	{context}

	Question:
	{question}
	"""
	user_role_prompt = UserRolePrompt(user_prompt_template)

	# Initialize components
	# Module-level instances shared by every request handled by this process.
	text_splitter = CharacterTextSplitter()
	chat_openai = ChatOpenAI()

	# Store vector databases for each session
	# Maps the session_id returned by /upload to the VectorDatabase built from
	# that upload. This is a plain in-process dict: entries are removed only by
	# DELETE /session/{session_id}.
	vector_dbs: dict = {}

	# JSON body accepted by POST /query.
	# (Documented with comments rather than a docstring so the generated schema
	# for this model is unchanged.)
	class QueryRequest(BaseModel):
	    # Key into vector_dbs; this is the session_id that /upload returned.
	    session_id: str

	    # The question to answer from the session's indexed document.
	    query: str

	@app.post("/upload")
	async def upload_file(file: UploadFile = File(...)):
	    """Index an uploaded document and open a query session for it.

	    The upload is written to a temporary file, loaded with ``PDFLoader`` when
	    its filename ends in ``.pdf`` (case-insensitive) and with
	    ``TextFileLoader`` otherwise, split into chunks, and built into a new
	    ``VectorDatabase`` that is stored in ``vector_dbs`` under a fresh UUID4
	    session id.

	    Args:
	        file: The multipart upload to index.

	    Returns:
	        A JSON response with ``session_id`` (to be sent with later
	        ``/query`` requests) and a confirmation ``message``.

	    Raises:
	        HTTPException: 500, with the underlying error text as detail, if
	            reading, parsing or indexing the upload fails.
	    """
	    import uuid

	    temp_path = None
	    try:
	        # delete=False keeps the file on disk after the handle is closed so
	        # the loader can reopen it by path. Leaving the ``with`` block
	        # closes (and therefore flushes) the file before it is read back.
	        with tempfile.NamedTemporaryFile(delete=False) as temp_file:
	            temp_path = temp_file.name
	            temp_file.write(await file.read())

	        # The client-supplied filename may be missing; treat that as
	        # "not a PDF" instead of failing on None.lower().
	        upload_name = (file.filename or "").lower()
	        if upload_name.endswith(".pdf"):
	            loader = PDFLoader(temp_path)
	        else:
	            loader = TextFileLoader(temp_path)

	        documents = loader.load_documents()
	        texts = text_splitter.split_texts(documents)

	        # Create the vector database for this upload.
	        vector_db = await VectorDatabase().abuild_from_list(texts)

	        # Generate the session id and remember the database under it.
	        session_id = str(uuid.uuid4())
	        vector_dbs[session_id] = vector_db

	        # Explicit headers retained from the original implementation, whose
	        # note says they are meant to prevent a browser popup.
	        return JSONResponse(
	            content={"session_id": session_id, "message": "File processed successfully"},
	            headers={
	                "Content-Type": "application/json",
	                "X-Content-Type-Options": "nosniff",
	            },
	        )

	    except HTTPException:
	        # Never rewrap a deliberate HTTP error as a 500.
	        raise
	    except Exception as e:
	        logger.error("Error processing upload: %s", e, exc_info=True)
	        raise HTTPException(status_code=500, detail=str(e)) from e
	    finally:
	        # Remove the temporary file on success *and* on failure; previously
	        # it was leaked whenever loading or indexing raised.
	        if temp_path is not None:
	            try:
	                os.unlink(temp_path)
	            except OSError:
	                logger.warning("Could not remove temporary file %s", temp_path, exc_info=True)

	@app.post("/query")
	async def query(request: QueryRequest):
	    """Answer a question using the document indexed for a session.

	    Looks up the session's vector database, retrieves the four best-matching
	    chunks for the query, fills the system and user prompt templates with
	    them, and asks the chat model for an answer.

	    Args:
	        request: Body carrying the ``session_id`` returned by ``/upload`` and
	            the ``query`` text.

	    Returns:
	        A dict with ``answer`` (the model response as a string) and
	        ``context`` (the retrieved chunks, as strings, that were given to
	        the model).

	    Raises:
	        HTTPException: 404 if ``session_id`` is unknown; 500, with the
	            underlying error text as detail, if retrieval or the model
	            call fails.
	    """
	    logger.info("Received query request with session_id: %s", request.session_id)

	    # The lookup lives outside the try block so the 404 reaches the client
	    # as a 404; raised inside, the generic handler turned it into a 500.
	    # ``is None`` avoids depending on the truthiness of the database object.
	    vector_db = vector_dbs.get(request.session_id)
	    if vector_db is None:
	        logger.error("Session not found: %s", request.session_id)
	        raise HTTPException(status_code=404, detail="Session not found")

	    try:
	        # Retrieve context. Each hit is indexed at [0] for its text
	        # (presumably a (text, score) pair -- confirm against VectorDatabase).
	        logger.info("Searching for context with query: %s", request.query)
	        context_list = await vector_db.search_by_text(request.query, k=4)
	        contexts = [str(context[0]) for context in context_list]
	        context_prompt = "\n".join(contexts)

	        # Generate prompts
	        formatted_system_prompt = system_role_prompt.create_message()
	        formatted_user_prompt = user_role_prompt.create_message(
	            question=request.query,
	            context=context_prompt,
	        )

	        # Get response
	        logger.info("Getting response from OpenAI")
	        response = await chat_openai.acomplete(
	            [formatted_system_prompt, formatted_user_prompt]
	        )
	        logger.info("Got response: %s", response)

	        return {
	            "answer": str(response),
	            "context": contexts,
	        }

	    except HTTPException:
	        # Preserve the status code of any HTTP error raised while answering.
	        raise
	    except Exception as e:
	        logger.error("Error processing query: %s", e, exc_info=True)
	        raise HTTPException(status_code=500, detail=str(e)) from e

	# Optional cleanup endpoint: discards the vector database held for one
	# session. Responds 404 when the session id is not known.
	@app.delete("/session/{session_id}")
	async def cleanup_session(session_id: str):
	    # Guard clause: reject unknown ids before touching the store.
	    if session_id not in vector_dbs:
	        raise HTTPException(status_code=404, detail="Session not found")

	    del vector_dbs[session_id]
	    return {"message": "Session cleaned up successfully"}

	# Root endpoint kept for reference but disabled: "/" is handled by the static-files mount at the end of this file.
	# @app.get("/")
	# async def read_root():
	# return JSONResponse(content={"message": "API is running"})

	# Health probe: always answers with a fixed "healthy" payload and does not
	# inspect any application state.
	@app.get("/health")
	async def health_check():
	    health_payload = {"status": "healthy"}
	    return health_payload

	# Serve the built frontend from "/". This must stay at the end of the file,
	# after every API route has been registered, so that the catch-all mount
	# does not take requests meant for those routes.
	_frontend_assets = StaticFiles(directory="/code/frontend/dist", html=True)
	app.mount("/", _frontend_assets, name="static")