# CADomatic — src/llm_client.py
# Author: YSMlearnsCode
# Commit: added updated vectorstore and added prompts (7dae9af)
import os
from pathlib import Path
from huggingface_hub import hf_hub_download
from langchain_community.vectorstores import FAISS
from langchain_google_genai import ChatGoogleGenerativeAI, GoogleGenerativeAIEmbeddings
from langchain.memory import ConversationBufferMemory
from langchain.schema import HumanMessage, AIMessage
from dotenv import load_dotenv
from langchain_huggingface import HuggingFaceEmbeddings
# --- Environment -----------------------------------------------------------
# Load the Gemini API key from a .env file; fail fast if it is absent so the
# module never initializes with an unusable LLM client.
load_dotenv()
GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
if not GEMINI_API_KEY:
    raise ValueError("GEMINI_API_KEY missing in .env")

# --- FAISS vectorstore setup -----------------------------------------------
# Prebuilt vectorstore hosted on the Hugging Face Hub; downloaded (and then
# cached locally by hf_hub_download) at import time — network is required on
# first run.
REPO_ID = "Yas1n/CADomatic_vectorstore"
FILENAME_FAISS = "index.faiss"
FILENAME_PKL = "index.pkl"

# Base instructions prepended to every prompt, read from
# <package root>/prompts/base_instruction.txt (resolved relative to this file).
BASE_PROMPT_PATH = Path(__file__).parent.parent / "prompts" / "base_instruction.txt"
if not BASE_PROMPT_PATH.exists():
    raise FileNotFoundError(f"Base instruction file not found: {BASE_PROMPT_PATH}")
with open(BASE_PROMPT_PATH, "r", encoding="utf-8") as f:
    BASE_INSTRUCTIONS = f.read().strip()

# Both index files land in the same cache directory, which is the folder
# FAISS.load_local expects.
faiss_path = hf_hub_download(repo_id=REPO_ID, filename=FILENAME_FAISS)
pkl_path = hf_hub_download(repo_id=REPO_ID, filename=FILENAME_PKL)
download_dir = Path(faiss_path).parent

# NOTE(review): the embedding model must match the one used to BUILD the
# vectorstore — presumably all-MiniLM-L6-v2; verify against the repo that
# produced Yas1n/CADomatic_vectorstore.
embedding = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
vectorstore = FAISS.load_local(
    str(download_dir),
    embeddings=embedding,
    # index.pkl is unpickled on load — only acceptable because the Hub repo
    # above is trusted; never point this at untrusted data.
    allow_dangerous_deserialization=True,
    index_name="index"
)
# Top-15 chunks are retrieved per query (see build_prompt).
retriever = vectorstore.as_retriever(search_kwargs={"k": 15})

# Conversation memory shared by build_prompt / prompt_llm / reset_memory.
memory = ConversationBufferMemory(return_messages=True)

# Gemini 2.5 Flash (LangChain wrapper, no genai import needed)
llm = ChatGoogleGenerativeAI(
    model="gemini-2.5-flash",
    temperature=0.7,
    api_key=GEMINI_API_KEY  # Use the key directly
)
def build_prompt(user_prompt: str) -> str:
    """Build the full LLM prompt: RAG context, base instructions, and history.

    Args:
        user_prompt: The user's current CAD instruction.

    Returns:
        A single prompt string combining the retrieved FreeCAD documentation
        chunks, the base instructions, the prior conversation rendered as
        "User:" / "Assistant:" lines, and the current instruction.
    """
    # Retrieve the most relevant documentation chunks for this query
    # (k is configured on the module-level retriever).
    docs = retriever.invoke(user_prompt)
    context = "\n\n".join(doc.page_content for doc in docs)

    # Render prior turns; message types other than Human/AI (e.g. system
    # messages) are intentionally skipped. Collect-then-join instead of
    # repeated string += (idiomatic, avoids quadratic concatenation).
    history_lines = []
    for msg in memory.chat_memory.messages:
        if isinstance(msg, HumanMessage):
            history_lines.append(f"User: {msg.content}\n")
        elif isinstance(msg, AIMessage):
            history_lines.append(f"Assistant: {msg.content}\n")
    history_text = "".join(history_lines)

    return f"""
You are a helpful assistant that writes FreeCAD Python scripts from CAD instructions.
Use the following FreeCAD wiki documentation as context:
{context}
Here are a few important instructions for you to follow
{BASE_INSTRUCTIONS}
Here is the conversation so far:
{history_text}
Current instruction:
{user_prompt}
Respond with valid FreeCAD 1.0.1 Python code only, no extra comments.
"""
def prompt_llm(user_prompt: str) -> str:
    """Generate FreeCAD code for *user_prompt* using Gemini 2.5 Flash.

    On success the exchange is appended to the conversation memory and the
    stripped model output is returned. On any failure the error is printed
    and an empty string is returned (best-effort: callers never see a raise).
    """
    final_prompt = build_prompt(user_prompt)
    try:
        reply = llm.invoke(final_prompt)
        code = reply.content.strip()
        # Record both sides of the exchange so follow-ups keep context.
        memory.chat_memory.add_user_message(user_prompt)
        memory.chat_memory.add_ai_message(code)
        return code
    except Exception as e:
        print("❌ Error generating FreeCAD code:", e)
        return ""
def reset_memory():
    """Drop all stored conversation turns by rebinding a fresh buffer."""
    global memory
    fresh = ConversationBufferMemory(return_messages=True)
    memory = fresh