Spaces:

Harshita-27
/

Askmydocs

Sleeping

Askmydocs / src /chat_model.py

HarshitaBhatia27

Speed up PDF indexing: batch embeddings, reduce chunk overlap, add size warning

12d7ca8 about 2 months ago

643 Bytes

	import os
	from langchain_groq import ChatGroq
	from langchain_huggingface import HuggingFaceEmbeddings

	def get_llm():
	    """Create the Groq chat model used by the application.

	    The API key is read from the ``GROQ_API_KEY`` environment variable and
	    passed to ``ChatGroq`` together with the fixed model name
	    ``llama-3.3-70b-versatile``.

	    Returns:
	        A ``ChatGroq`` instance configured with the key found in the
	        environment (``None`` is passed through when the variable is unset).
	    """
	    # Imported locally so this function stays self-contained.
	    import logging

	    api_key = os.environ.get("GROQ_API_KEY")
	    if not api_key:
	        # Report only the actionable case; never log the key or its length,
	        # since even metadata about a credential does not belong in logs.
	        logging.getLogger(__name__).warning(
	            "GROQ_API_KEY is not set; the Groq client cannot authenticate without it."
	        )
	    return ChatGroq(model="llama-3.3-70b-versatile", groq_api_key=api_key)

	def get_embeddings():
	    """Build the HuggingFace embeddings wrapper for ``BAAI/bge-small-en``.

	    Returns:
	        A ``HuggingFaceEmbeddings`` instance whose ``encode_kwargs`` request
	        batches of 64 inputs and normalized output vectors.
	    """
	    encode_options = {
	        # Encode up to 64 texts per batch.
	        "batch_size": 64,
	        # Ask the encoder for normalized embeddings (recommended for BGE
	        # models -- NOTE(review): confirm against the model card).
	        "normalize_embeddings": True,
	    }
	    return HuggingFaceEmbeddings(
	        model_name="BAAI/bge-small-en",
	        encode_kwargs=encode_options,
	    )