Spaces:

anthonym21
/

ask-my-research

Running

App Files Community

anthonym21 committed on 28 days ago

Commit

fdae7a6

1 Parent(s): 1649f04

Fix Gradio 5.x ChatInterface compatibility - add type='messages'

Browse files

Files changed (1) hide show

app.py +18 -46

app.py CHANGED Viewed

@@ -14,7 +14,7 @@ import spaces
 import torch
 import faiss
 from sentence_transformers import SentenceTransformer
-from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
 # =============================================================================
 # Configuration
@@ -182,7 +182,7 @@ def format_citations(retrieved_chunks: list[dict]) -> str:
 # Generation with ZeroGPU
 # =============================================================================
-@spaces.GPU(duration=60)
 def generate_response(query: str, context: str) -> str:
     """Generate response using the LLM with ZeroGPU."""
@@ -236,25 +236,25 @@ Provide a helpful answer based ONLY on the context above. If the context doesn't
 # Chat Function
 # =============================================================================
-def chat(message: str, history: list, request: gr.Request) -> tuple[str, list]:
     """Main chat function."""
     # Rate limit check
     allowed, error_msg = check_rate_limit(request)
     if not allowed:
-        return error_msg, history
     if not message.strip():
-        return "Please enter a question.", history
     if faiss_index is None:
-        return "The paper index is not loaded. Please check the Space configuration.", history
     # Retrieve relevant chunks
     retrieved = retrieve(message)
     if not retrieved:
-        return "I couldn't find relevant information in the indexed papers.", history
     # Format context
     context = format_context(retrieved)
@@ -263,14 +263,14 @@ def chat(message: str, history: list, request: gr.Request) -> tuple[str, list]:
     try:
         response = generate_response(message, context)
     except Exception as e:
-        return f"Error generating response: {str(e)}", history
     # Add citations
     citations = format_citations(retrieved)
     if citations:
         response = f"{response}\n\n**Sources:**\n{citations}"
-    return response, history + [[message, response]]
 # =============================================================================
@@ -278,7 +278,7 @@ def chat(message: str, history: list, request: gr.Request) -> tuple[str, list]:
 # =============================================================================
 DESCRIPTION = """
-# Ask My Research
 Chat with Anthony Maio's AI safety research papers. Ask questions about:
@@ -300,45 +300,17 @@ EXAMPLES = [
     "How do weak verifiers fail to detect deceptive reasoning?",
 ]
-with gr.Blocks(
     title="Ask My Research",
     theme=gr.themes.Soft(
         primary_hue="orange",
-        secondary_hue="amber",
-    )
-) as demo:
-    gr.Markdown(DESCRIPTION)
-    chatbot = gr.Chatbot(
-        label="Conversation",
-        height=400,
-        show_copy_button=True,
-    )
-    with gr.Row():
-        msg = gr.Textbox(
-            label="Your question",
-            placeholder="Ask about the research papers...",
-            scale=4,
-            show_label=False,
-        )
-        submit = gr.Button("Ask", variant="primary", scale=1)
-    gr.Examples(
-        examples=EXAMPLES,
-        inputs=msg,
-        label="Example questions"
-    )
-    gr.Markdown("""
-    ---
-    *Rate limited to 20 questions/hour. Built by [Anthony Maio](https://making-minds.ai) | [Research Papers](https://making-minds.ai/research)*
-    """)
-    # Event handlers
-    msg.submit(chat, [msg, chatbot], [msg, chatbot])
-    submit.click(chat, [msg, chatbot], [msg, chatbot])
 if __name__ == "__main__":
     demo.launch()

 import torch
 import faiss
 from sentence_transformers import SentenceTransformer
+from transformers import AutoModelForCausalLM, AutoTokenizer
 # =============================================================================
 # Configuration
 # Generation with ZeroGPU
 # =============================================================================
+@spaces.GPU(duration=120)
 def generate_response(query: str, context: str) -> str:
     """Generate response using the LLM with ZeroGPU."""
 # Chat Function
 # =============================================================================
+def chat(message: str, history: list, request: gr.Request) -> str:
     """Main chat function."""
     # Rate limit check
     allowed, error_msg = check_rate_limit(request)
     if not allowed:
+        return error_msg
     if not message.strip():
+        return "Please enter a question."
     if faiss_index is None:
+        return "The paper index is not loaded. Please check the Space configuration."
     # Retrieve relevant chunks
     retrieved = retrieve(message)
     if not retrieved:
+        return "I couldn't find relevant information in the indexed papers."
     # Format context
     context = format_context(retrieved)
     try:
         response = generate_response(message, context)
     except Exception as e:
+        return f"Error generating response: {str(e)}"
     # Add citations
     citations = format_citations(retrieved)
     if citations:
         response = f"{response}\n\n**Sources:**\n{citations}"
+    return response
 # =============================================================================
 # =============================================================================
 DESCRIPTION = """
+# 🔬 Ask My Research
 Chat with Anthony Maio's AI safety research papers. Ask questions about:
     "How do weak verifiers fail to detect deceptive reasoning?",
 ]
+demo = gr.ChatInterface(
+    fn=chat,
+    type="messages",
     title="Ask My Research",
+    description=DESCRIPTION,
+    examples=EXAMPLES,
     theme=gr.themes.Soft(
         primary_hue="orange",
+        secondary_hue="yellow",
+    ),
+)
 if __name__ == "__main__":
     demo.launch()