Update app.py

app.py CHANGED
@@ -15,24 +15,20 @@ from langchain_huggingface import HuggingFaceEmbeddings
 from langchain_community.vectorstores import Chroma
 
 # ==========================================
-# 2. CONNECT TO AI APIS (
+# 2. CONNECT TO AI APIS (OpenAI-Compatible)
 # ==========================================
 print("⏳ Connecting to Hugging Face APIs...")
 
-# Get token from environment variable (Set this in HF Spaces Secrets)
 HF_TOKEN = os.environ.get("HF_TOKEN")
 
 if not HF_TOKEN:
     print("⚠️ WARNING: HF_TOKEN not found! The AI will not be able to generate responses.")
 
-#
-
+# Initialize a single, generic client
+# We do NOT bind the model name here to prevent the "text-generation" tagging error
+hf_client = InferenceClient(api_key=HF_TOKEN)
 
-#
-# We use the 7B version since the cloud API handles the compute!
-vision_client = InferenceClient("Qwen/Qwen2-VL-7B-Instruct", token=HF_TOKEN)
-
-# --- C. Local Embeddings & Whisper (Runs fine on CPU) ---
+# Local Embeddings & Whisper
 embedding_model = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
 whisper_model = whisper.load_model("base")
 
@@ -59,7 +55,6 @@ def save_to_json(user_msg, combined_ans, mode):
     with open(chat_history_file, "w") as f: json.dump(history, f, indent=4)
 
 def process_pdf_to_markdown(pdf_path, extract_images=True):
-    """Converts PDF to Markdown. Optionally extracts images."""
     global main_extracted_images
     output_image_dir = "extracted_images"
 
@@ -80,7 +75,6 @@ def process_pdf_to_markdown(pdf_path, extract_images=True):
     except Exception as e:
         return ""
 
-# --- UPLOAD HANDLER 1: MAIN PAPER ---
 def process_main_paper(file_obj):
     global main_paper_retriever
     main_paper_retriever = None
@@ -97,7 +91,6 @@ def process_main_paper(file_obj):
     except Exception as e:
         return f"❌ Error: {str(e)}"
 
-# --- UPLOAD HANDLER 2: REFERENCE SET ---
 def process_brainstorm_papers(file_list):
     global brainstorm_retriever
     brainstorm_retriever = None
@@ -126,27 +119,23 @@ def transcribe_audio(audio_path):
     return whisper_model.transcribe(audio_path)["text"].strip()
 
 # ==========================================
-# 4. INTELLIGENCE LAYERS (
+# 4. INTELLIGENCE LAYERS (STRICT CHAT ROUTING)
 # ==========================================
 
-# Helper function to call Mistral API
-# Helper function to call Mistral API (Updated for Conversational Task)
 def ask_mistral(prompt):
     try:
-        # Format the prompt as a chat message
         messages = [{"role": "user", "content": prompt}]
-
-
-
-            messages=messages,
-            max_tokens=1000,
+        # This explicitly hits the /v1/chat/completions route
+        response = hf_client.chat.completions.create(
+            model="mistralai/Mistral-7B-Instruct-v0.3",
+            messages=messages,
+            max_tokens=1000,
             temperature=0.3
         )
         return response.choices[0].message.content
     except Exception as e:
         return f"⚠️ API Error (Mistral): {str(e)}"
 
-# Helper function to call Qwen API
 def ask_qwen(prompt, image_paths):
     try:
         messages = [{"role": "user", "content": []}]
@@ -159,23 +148,26 @@ def ask_qwen(prompt, image_paths):
             })
         messages[0]["content"].append({"type": "text", "text": prompt})
 
-
+        # Enforce chat completions route for Vision model too
+        response = hf_client.chat.completions.create(
+            model="Qwen/Qwen2-VL-7B-Instruct",
+            messages=messages,
+            max_tokens=150
+        )
         return response.choices[0].message.content
     except Exception as e:
-        return f"⚠️ API Error (Qwen - Server
+        return f"⚠️ API Error (Qwen - Server busy): {str(e)}"
 
 # MODE 1: CHAT WITH MAIN PAPER
 def get_main_paper_response(question):
     global main_paper_retriever, main_extracted_images
     vision_context = ""
 
-    # Vision Pass
     if main_extracted_images:
         images_to_process = main_extracted_images[:3]
         vision_prompt = f"Relate these images to: {question}"
         vision_context = ask_qwen(vision_prompt, images_to_process)
 
-    # Text Pass
     if main_paper_retriever:
         docs = main_paper_retriever.invoke(question)
         text_context = "\n\n".join(d.page_content for d in docs)
@@ -228,7 +220,6 @@ Context: {context}
 Task: Generate a draft for a paper about: {question} [/INST]"""
     return ask_mistral(prompt)
 
-
 # ==========================================
 # 5. GRADIO UI
 # ==========================================
@@ -239,7 +230,6 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("Pipeline: Analyze -> Find Novelty -> Design Setup -> Write Draft")
 
     with gr.Row():
-        # --- LEFT: CONTROLS ---
         with gr.Column(scale=1):
 
             mode_radio = gr.Radio(
@@ -264,7 +254,6 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
 
             clear_btn = gr.Button("🗑️ Clear Workspace")
 
-        # --- RIGHT: WORKSPACE ---
         with gr.Column(scale=2):
             chatbot = gr.Chatbot(label="Lab Assistant", height=700)
             audio_input = gr.Audio(sources=["microphone"], type="filepath", label="🎤 Dictate Idea")
@@ -273,18 +262,15 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
             msg_input = gr.Textbox(placeholder="Enter your query or research topic...", scale=4)
             send_btn = gr.Button("🚀 Execute", variant="primary", scale=1)
 
-    # --- HANDLERS ---
     file_main.change(fn=process_main_paper, inputs=file_main, outputs=status_main)
     file_refs.change(fn=process_brainstorm_papers, inputs=file_refs, outputs=status_refs)
     audio_input.stop_recording(fn=transcribe_audio, inputs=audio_input, outputs=msg_input)
     clear_btn.click(fn=reset_chat, outputs=chatbot)
 
-    # --- MAIN ROUTER ---
     def respond(message, history, mode):
         if not message.strip(): return "", history
         if history is None: history = []
 
-        # Route based on selected Stage
         if mode == "1. Chat with Paper":
             response = get_main_paper_response(message)
         elif mode == "2. Brainstorm Novelty":
@@ -296,7 +282,6 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
         else:
            response = "Error: Unknown Mode"
 
-        # Log & Update
         final_ans = f"**[{mode}]**\n{response}"
         save_to_json(message, final_ans, mode)
         history.append({"role": "user", "content": message})
@@ -308,5 +293,4 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
     send_btn.click(respond, [msg_input, chatbot, mode_radio], [msg_input, chatbot])
 
 print("🚀 Launching Production Research Scientist Lab...")
-# In HF Spaces, we don't need share=True
 demo.launch()
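
The whole change boils down to one routing pattern: construct a single InferenceClient with no pinned model, then name the model per call through chat.completions.create(), which always targets the chat-completion route. A minimal standalone sketch of that pattern (model IDs, token handling, and sampling parameters are taken from the diff; the example prompt and print() are illustrative only):

# Minimal sketch of the new routing pattern, runnable outside the Space.
import os
from huggingface_hub import InferenceClient

HF_TOKEN = os.environ.get("HF_TOKEN")

# Old pattern (removed above): pin the model at construction time. The client
# then resolves a default task for that model, which can tag a chat model as
# "text-generation" and reject chat-style payloads.
#   vision_client = InferenceClient("Qwen/Qwen2-VL-7B-Instruct", token=HF_TOKEN)

# New pattern: one generic client; each call names its model explicitly and
# chat.completions.create() always hits the /v1/chat/completions route.
client = InferenceClient(api_key=HF_TOKEN)

response = client.chat.completions.create(
    model="mistralai/Mistral-7B-Instruct-v0.3",
    messages=[{"role": "user", "content": "Say hello in one sentence."}],
    max_tokens=1000,
    temperature=0.3,
)
print(response.choices[0].message.content)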
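ask_qwen() sends the same route a multimodal message; the hunk shows the text part being appended but elides how the images enter the list. A sketch of one common way to attach local files, assuming base64 data URLs (the encoding helper and the function name are illustrative, not from app.py; the text append and the chat.completions.create() call match the diff):

# Sketch of the multimodal payload ask_qwen() assembles. The image-append
# step sits outside the visible hunk, so the data-URL encoding below is an
# assumption about how local image files reach the API.
import base64
from huggingface_hub import InferenceClient

def _image_to_data_url(path):
    # Encode a local image file as a data URL accepted by the chat route.
    with open(path, "rb") as f:
        encoded = base64.b64encode(f.read()).decode("utf-8")
    return f"data:image/png;base64,{encoded}"

def ask_qwen_sketch(client, prompt, image_paths):
    messages = [{"role": "user", "content": []}]
    for path in image_paths:
        messages[0]["content"].append({
            "type": "image_url",
            "image_url": {"url": _image_to_data_url(path)},
        })
    messages[0]["content"].append({"type": "text", "text": prompt})
    response = client.chat.completions.create(
        model="Qwen/Qwen2-VL-7B-Instruct",
        messages=messages,
        max_tokens=150,
    )
    return response.choices[0].message.content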
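For the draft mode, the visible hunks show retrieval via main_paper_retriever.invoke(), context flattening, and a template ending in [/INST] handed to ask_mistral(). A sketch of how those pieces plausibly fit together (the [INST] opening and the instruction wording before the context are assumptions about the elided lines; only the closing template lines appear in the diff):

# Sketch of how the draft mode plausibly builds its Mistral-instruct prompt.
def build_draft_prompt(retriever, question):
    docs = retriever.invoke(question)                    # LangChain retriever API
    context = "\n\n".join(d.page_content for d in docs)  # flatten retrieved chunks
    return f"""[INST] Use the context to write a research draft.
Context: {context}
Task: Generate a draft for a paper about: {question} [/INST]"""

# The returned string is passed to ask_mistral(), which wraps it in a single
# user message for the chat-completions call.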