Spaces:
Sleeping
Sleeping
added app.py to hf space
Browse files
app.py
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import os

import gradio as gr
from langchain.document_loaders import PyPDFLoader
from langchain.embeddings import HuggingFaceEmbeddings
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.vectorstores import Chroma
from openai import AzureOpenAI
from sentence_transformers import SentenceTransformer
|
| 8 |
+
|
| 9 |
+
# Load the Tiruvāsagam PDF and split it into overlapping chunks for retrieval.
pdf_loader = PyPDFLoader("tiru.pdf")
docs = pdf_loader.load()

# 500-char chunks with 50-char overlap keep verse context across boundaries.
text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
chunks = text_splitter.split_documents(docs)
| 16 |
+
|
| 17 |
+
# Local multilingual embedding model (covers Tamil).
embedding_model = SentenceTransformer("intfloat/multilingual-e5-large")


def embed(texts):
    """Encode *texts* with the local sentence-transformer.

    Returns the embeddings as a numpy array (``convert_to_numpy=True``).
    """
    return embedding_model.encode(texts, convert_to_numpy=True)
| 20 |
+
|
| 21 |
+
# Store the chunks in Chroma and expose a top-3 similarity retriever.
# FIX: LangChain's Chroma.from_documents expects an `embedding` object that
# implements the Embeddings interface — it has no `embedding_function=`
# keyword taking a bare callable, so the original call failed at runtime.
# HuggingFaceEmbeddings wraps the same sentence-transformers model.
_embeddings = HuggingFaceEmbeddings(model_name="intfloat/multilingual-e5-large")
vectorstore = Chroma.from_documents(chunks, embedding=_embeddings)
retriever = vectorstore.as_retriever(search_type="similarity", search_kwargs={"k": 3})
| 24 |
+
|
| 25 |
+
# Azure OpenAI client, configured entirely from environment variables
# (AZURE_OPENAI_API_KEY / AZURE_OPENAI_ENDPOINT are set as Space secrets).
client = AzureOpenAI(
    azure_endpoint=os.getenv("AZURE_OPENAI_ENDPOINT"),
    api_key=os.getenv("AZURE_OPENAI_API_KEY"),
    api_version="2025-01-01-preview",
)
|
| 31 |
+
|
| 32 |
+
# Chat function
def chat_fn(message, history):
    """Answer a question about the Tiruvāsagam via retrieval-augmented generation.

    Parameters
    ----------
    message : str
        The user's question.
    history : list
        Prior chat turns supplied by ``gr.ChatInterface`` (unused — the model
        only sees the current question plus the retrieved context).

    Returns
    -------
    str
        The model's answer text.
    """
    # Retrieve the top-k chunks relevant to the question.
    docs = retriever.get_relevant_documents(message)
    context = "\n\n".join(d.page_content for d in docs)

    # Call Azure OpenAI (GPT-4)
    completion = client.chat.completions.create(
        model="gpt-4.1",  # your Azure deployment name
        messages=[
            {"role": "system", "content": "You are a helpful assistant answering from Tiruvāsagam.Message in tamil maximum the tamil should be basic without any spelling and grammer mistakes in it. Be as token effecient. Mainly for any question not related to Thiruvasagam or lord Shiva or Author manichavasagar just reply I have no knowlage or I don't know i tamil use only tamil i say it again"},
            {"role": "user", "content": f"Context:\n{context}\n\nQuestion: {message}"},
        ],
        temperature=0.8,
        # FIX: the API parameter is `max_tokens`; the original `max_token=500`
        # raised TypeError on every call.
        max_tokens=500,
    )
    return completion.choices[0].message.content
|
| 49 |
+
|
| 50 |
+
# Gradio chat UI wired to the RAG answer function.
chatbot = gr.ChatInterface(
    chat_fn,
    title="திருவாசகம் RAG Chatbot",
    description="திருவாசகத்தை அடிப்படையாகக் கொண்டு கேள்விகளை கேளுங்கள் (Tamil/English supported).",
)
|
| 56 |
+
|
| 57 |
+
# Entry point: serve the app on all interfaces (HF Spaces expects port 7860).
if __name__ == "__main__":
    chatbot.launch(
        server_name="0.0.0.0",
        server_port=7860,
        debug=True,
    )
|