Spaces:

makdadTaleb
/

rag-lecture-saver-api

Sleeping

Upload folder using huggingface_hub

4e7e4c0 verified 2 months ago

1.9 kB

	import os
	import logging
	from typing import List
	from groq import Groq
	import asyncio

	# Module-level logger; LLMClient.generate uses it to record failed Groq calls.
	logger = logging.getLogger("llm-client")


	# System prompt sent as the "system" message on every request. It restricts
	# the model to the supplied context, asks for bracketed reference numbers,
	# and fixes the fallback sentence used when the answer is not in the context.
	SYSTEM_PROMPT = """
	You are a university teaching assistant.

	Rules:
	- Answer the question using ONLY the provided context.
	- You may rephrase or translate the information to match the language of the user's question.
	- Do NOT add new information.
	- Do NOT use external knowledge.
	- When you state a fact, add the reference number in square brackets, e.g. [1], [2].
	- If the answer is not explicitly present, say:
	"Not found in the provided lecture material."
	"""


	class LLMClient:
	def __init__(self):
	api_key = os.getenv("GROQ_API_KEY")
	if not api_key:
	raise RuntimeError("GROQ_API_KEY not set")

	self.model = os.getenv(
	"GROQ_MODEL",
	"llama-3.3-70b-versatile"
	)

	self.client = Groq(api_key=api_key)

	async def generate(
	self,
	question: str,
	context_chunks: List[str],
	chat_history: List[str] \| None = None
	) -> str:
	context = "\n\n".join(context_chunks)

	messages = [
	{"role": "system", "content": SYSTEM_PROMPT},
	{
	"role": "user",
	"content": f"Context:\n{context}\n\nQuestion:\n{question}"
	}
	]

	try:
	response = await asyncio.to_thread(
	self.client.chat.completions.create,
	model=self.model,
	messages=messages,
	temperature=0.3,
	max_tokens=512

	)
	return response.choices[0].message.content.strip()

	except Exception as e:
	logger.exception("Groq LLM call failed")
	raise RuntimeError("LLMGenerationError") from e