Spaces:

ajoy0071998
/

PDF_Query_System

Sleeping

App Files Files Community

ajoy0071998 committed on Nov 8, 2025

Commit

382ac8a

verified ·

1 Parent(s): 019b810

Upload 6 files

Browse files

Files changed (6) hide show

.env +2 -0
app.py +41 -0
audio_text.py +29 -0
llm_response.py +84 -0
male_voice.py +12 -0
requirements.txt +5 -0

.env ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ GROQ_API_KEY="<REDACTED: revoke this key and provide it through the Space's secret settings>"
2	+ ASSEMBLY_API_KEY="<REDACTED: revoke this key and provide it through the Space's secret settings>"

app.py ADDED Viewed

	@@ -0,0 +1,41 @@

+import streamlit as st
+import asyncio
+import os
+from llm_response import get_response
+from male_voice import text_to_speech
+st.set_page_config(page_title="Ajoy Prasad Bot", layout="centered")
+st.title("Bot on behalf of Ajoy Prasad")
+tab_text, tab_voice = st.tabs(["Type Your Question", "Voice Input (Coming Soon)"])
+with tab_text:
+    user_input = st.text_input(
+        "Type your question and press Enter:",
+        placeholder="Ask Ajoy anything...",
+        key="text_input",
+        label_visibility="collapsed"
+    )
+    if user_input:
+        with st.spinner("Ajoy is thinking..."):
+            try:
+                response = asyncio.run(get_response(user_input))
+                audio_file = "response.wav"
+                asyncio.run(text_to_speech(response, audio_file))
+                if os.path.exists(audio_file):
+                    st.audio(audio_file, format="audio/wav", autoplay=True)
+                else:
+                    st.warning("Audio file not generated.")
+                st.markdown("### **Ajoy's Answer:**")
+                st.write(response)
+            except Exception as e:
+                st.error(f"An error occurred: {str(e)}")
+                st.info("Please try again with a different question.")
+with tab_voice:
+    st.info("Voice input feature coming soon!")
+    st.write("You'll be able to speak your question directly to Ajoy.")

audio_text.py ADDED Viewed

	@@ -0,0 +1,29 @@

+import logging
+import os
+from dotenv import load_dotenv
+import assemblyai as aai
+# Configure the root logger at import time with level INFO.
+logging.basicConfig(level=logging.INFO)
+# Module-level logger named after this module; used by transcribe_audio.
+logger = logging.getLogger(__name__)
+def transcribe_audio(audio_file: str) -> str:
+    try:
+        load_dotenv()
+        API_KEY = os.getenv('ASSEMBLY_API_KEY')
+        if not API_KEY:
+            raise ValueError("ASSEMBLY_API_KEY not found in environment variables.")
+        aai.settings.api_key = API_KEY
+        logger.info(f"Starting transcription for: {audio_file}")
+        transcript = aai.Transcriber().transcribe(audio_file)
+        if transcript.status == "error":
+            raise RuntimeError(f"Transcription failed: {transcript.error}")
+        logger.info("Transcription completed successfully.")
+        return transcript.text
+    except Exception as e:
+        logger.error(f"Error during transcription: {e}")
+        return ""
+if __name__ == "__main__":
+    audio_path = "male_voice.wav"
+    text_output = transcribe_audio(audio_path)
+    print(text_output)

llm_response.py ADDED Viewed

	@@ -0,0 +1,84 @@

+import logging
+import asyncio
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+from dotenv import load_dotenv
+load_dotenv()
+import os
+GROQ_API_KEY = os.getenv("GROQ_API_KEY")
+from langchain_groq import ChatGroq
+llm = ChatGroq(
+    model="llama-3.3-70b-versatile",
+    groq_api_key=GROQ_API_KEY,
+    temperature=0,
+    max_retries=1,
+)
+# Persona prompt describing Ajoy's profile and the expected answer style;
+# get_response sends it to the model together with the user's question.
+# NOTE(review): a few lines switch from second to third person ("he is in
+# home town") and contain typos; the text is left verbatim because it is
+# sent to the model at runtime.
+PROMPT = """
+You are Ajoy Prasad — an AI Developer from India (West Bengal – Malda), currently pursuing an M.Tech in Artificial Intelligence (CSE) at the National Institute of Technology Bhopal (NIT Bhopal), graduating in June 2025 with a CGPA of 7.00.
+You also hold a B.Tech in Mechanical Engineering from St. Mary’s Technical Campus Kolkata (June 2022) with a CGPA of 8.32.
+Currently, he is in home town
+You are being interviewed by the 100x AI team for their AI Agent Engineer role.
+You must respond exactly as Ajoy would — natural, thoughtful, and confident.
+Your responses should reflect his real experience, tone, and background, showing technical depth, curiosity, and clear communication.
+Keep answers concise (2–4 sentences) and conversational, not robotic.
+Here’s Ajoy’s background and profile:
+Professional Summary:
+- AI Developer with strong mathematical foundations, experienced in building multilingual LLM apps and Retrieval-Augmented Generation (RAG) pipelines.
+- Skilled in developing backend AI services with FastAPI, LangChain, Pinecone, and PostgreSQL.
+- Focused on practical AI applications integrating NLP, OCR, and Generative AI for real-world use.
+Education:
+- M.Tech (Artificial Intelligence, CSE) — NIT Bhopal (2023–2025), CGPA 7.00
+- B.Tech (Mechanical Engineering) — St. Mary’s Technical Campus Kolkata (2018–2022), CGPA 8.32
+-M.Tech is completed at june 2025
+Technical Skills:
+- Languages: Python, C++
+- Specializations: Python Development, NLP, Machine Learning, Deep Learning, Generative AI, OCR
+- Frameworks / Tools: LangChain, LangGraph, FastAPI, RESTful APIs, JWT Authentication, Google Auth, AWS SES
+- Databases & Storage: Pinecone (Vector DB), PostgreSQL, AWS S3
+- Libraries: Scikit-learn, TensorFlow, Hugging Face, OpenCV, NLTK, SpaCy
+- Platforms: Git, AWS
+Experience:
+AI Engineer — Gravitas AI (1st July 2025 – 4th November 2025)
+- Built a multilingual (Hindi + English) document-based RAG chatbot with OCR, web-scraped inputs, and Pinecone semantic retrieval with inline citations.
+- Implemented a local serverless setup with API Gateway, JWT Authentication, and AWS SES for secure access.
+- Managed document storage on AWS S3 and user data (profiles, chats, plans, usage limits) using PostgreSQL.
+- Due to the requirement of the company,The postion is closed for me.
+Projects:
+1. AI Interview Assistant (May 2025) — GitHub: acrobyte007/Agentic_AI
+   - FastAPI app that analyzes resumes and generates summaries with tailored interview questions using LangGraph workflows.
+2. Satellite Image Classification (October 2024) — GitHub: acrobyte007/Optimiezed-CNN
+   - Developed lightweight CNN models with 0.94 accuracy and 30 percent fewer parameters optimized for low-resource platforms using channel separation and SE blocks.
+3. RAG-Based PDF Query System (March 2024) — GitHub: acrobyte007/PDF_Query
+   - Built a question-answering system using LangChain, SBERT embeddings, Faiss, and Mistral API with efficient text chunking and semantic retrieval.
+Achievements:
+- Qualified GATE with a score of 496
+Personality & Values:
+- Curious learner driven by problem-solving and AI innovation.
+- Believes in clarity, collaboration, and continuous improvement.
+- Values ethical AI development and scalable real-world solutions.
+- Calm, analytical, and structured thinker who enjoys building intelligent systems from scratch.
+When the interviewer asks a question, respond exactly as Ajoy would — intelligent, humble, and professional.
+If the question is casual, keep the tone friendly; if it’s technical, be precise and confident.
+Now the interviewer says:
+"""
+async def get_response(question: str):
+    response = await llm.ainvoke(PROMPT + question)
+    return response.content

male_voice.py ADDED Viewed

	@@ -0,0 +1,12 @@

+import edge_tts
+# Voice name passed to edge_tts.Communicate by text_to_speech.
+voice = "en-US-GuyNeural"  # male voice
+# Speaking-rate value passed to edge_tts.Communicate; "+0%" presumably means
+# the default speed — confirm against the edge-tts documentation.
+rate = "+0%"
+async def text_to_speech(text, filename):
+    communicate = edge_tts.Communicate(text, voice=voice, rate=rate)
+    await communicate.save(filename)
+    print(f"Audio saved as {filename}")

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+streamlit
+python-dotenv
+langchain-groq
+assemblyai
+edge-tts