Spaces:

mXn1
/

epadoms

Sleeping

App Files Files Community

epadoms / backend /main.py

mXn1

Upload backend

5d50e27 verified 12 days ago

raw

history blame contribute delete

3.62 kB

	"""e-Padoms FastAPI backend."""
	import asyncio
	import time
	import uuid
	from typing import Literal

	from fastapi import FastAPI, HTTPException
	from fastapi.middleware.cors import CORSMiddleware
	from pydantic import BaseModel
	from sse_starlette.sse import EventSourceResponse

	from rag.pipeline import chat_stream
	from rag.retriever import Retriever

	app = FastAPI(title="e-Padoms API", version="1.0.0")

	app.add_middleware(
	CORSMiddleware,
	allow_origins=["*"],
	allow_methods=["*"],
	allow_headers=["*"],
	)

	# In-memory conversation store: {conversation_id: {"messages": [...], "last_active": float}}
	_conversations: dict[str, dict] = {}
	CONVERSATION_TTL = 30 * 60 # 30 minutes

	_retriever = Retriever()

	SUGGESTIONS = [
	"How do I register a SIA (limited liability company) in Latvia?",
	"What taxes apply to Latvian startups?",
	"What is the Startup Law and how do I qualify?",
	"What is LIAA and how does it support startups?",
	"Can a foreigner start a company in Latvia?",
	"What is the difference between SIA and IK?",
	]


	def _expire_conversations():
	now = time.time()
	expired = [k for k, v in _conversations.items() if now - v["last_active"] > CONVERSATION_TTL]
	for k in expired:
	del _conversations[k]


	class ChatRequest(BaseModel):
	message: str
	conversation_id: str \| None = None
	language: Literal["lv", "en", "auto"] = "auto"


	@app.get("/api/health")
	async def health():
	return {"status": "ok", "documents_indexed": _retriever.count()}


	@app.get("/api/suggestions")
	async def suggestions():
	return {"suggestions": SUGGESTIONS}


	@app.post("/api/chat")
	async def chat(req: ChatRequest):
	if not req.message.strip():
	raise HTTPException(status_code=400, detail="Message cannot be empty")
	if len(req.message) > 2000:
	raise HTTPException(status_code=400, detail="Message too long (max 2000 chars)")

	_expire_conversations()

	conv_id = req.conversation_id or str(uuid.uuid4())
	if conv_id not in _conversations:
	_conversations[conv_id] = {"messages": [], "last_active": time.time()}

	conv = _conversations[conv_id]
	conv["last_active"] = time.time()
	history = conv["messages"]

	# Add user message to history
	history.append({"role": "user", "content": req.message})
	# Keep last 10 messages (5 turns)
	if len(history) > 10:
	history[:] = history[-10:]

	assistant_response_parts: list[str] = []

	async def event_generator():
	try:
	async for event_data in chat_stream(req.message, history[:-1], req.language):
	import json
	parsed = json.loads(event_data)
	if parsed["type"] == "token":
	assistant_response_parts.append(parsed["content"])
	yield {"data": event_data}
	except Exception as e:
	import json
	yield {"data": json.dumps({"type": "error", "content": str(e)})}
	finally:
	# Store assistant's full response in history
	full_response = "".join(assistant_response_parts)
	if full_response:
	history.append({"role": "assistant", "content": full_response})
	if len(history) > 10:
	history[:] = history[-10:]

	return EventSourceResponse(
	event_generator(),
	headers={"X-Accel-Buffering": "no"},
	)
	from fastapi.staticfiles import StaticFiles
	from pathlib import Path

	_here = Path(__file__).parent
	_frontend = _here / "frontend_dist"
	app.mount("/", StaticFiles(directory=str(_frontend), html=True), name="frontend")