Spaces:

bajajhackrx
/

model

Sleeping

App Files Files Community

sohamchitimali committed on Aug 6, 2025

Commit

8a6c8ae

1 Parent(s): bece185

Frontend Fix

Browse files

Files changed (1) hide show

app.py +187 -142

app.py CHANGED Viewed

@@ -666,164 +666,209 @@ class HighPerformanceSystem:
 # Initialize the system
 high_performance_system = HighPerformanceSystem()
-def process_hackathon_submission(document_url: str, questions_text: str) -> str:
-    """Main hackathon submission processing function"""
-    try:
-        if not document_url.strip():
-            return json.dumps({"error": "Document URL is required"}, indent=2)
-        if not questions_text.strip():
-            return json.dumps({"error": "Questions are required"}, indent=2)
-        try:
-            if questions_text.strip().startswith('['):
-                questions = json.loads(questions_text)
-            else:
-                questions = [q.strip() for q in questions_text.split('\n') if q.strip()]
-        except json.JSONDecodeError:
-            questions = [q.strip() for q in questions_text.split('\n') if q.strip()]
-        if not questions:
-            return json.dumps({"error": "No valid questions found"}, indent=2)
-        doc_result = high_performance_system.process_document_optimized(document_url)
-        if not doc_result.get('success'):
-            return json.dumps({"error": f"Document processing failed: {doc_result.get('error')}"}, indent=2)
-        batch_result = high_performance_system.process_batch_queries_optimized(questions)
-        response = {
-            "answers": [result['answer'] for result in batch_result['answers']],
-            "metrics": {
-                "total_processing_time": batch_result['processing_time'],
-                "average_confidence": np.mean([result['confidence'] for result in batch_result['answers']]) if batch_result['answers'] else 0.0,
-                "total_tokens": sum(result['token_count'] for result in batch_result['answers'])
-            }
-        }
-        return json.dumps(response, indent=2)
-    except Exception as e:
-        logger.error(f"Submission processing error: {e}")
-        return json.dumps({"error": f"System error: {str(e)}"}, indent=2)
-def process_single_question(document_url: str, question: str) -> str:
-    """Process single question with detailed output"""
-    if not document_url.strip():
-        return "Error: Document URL is required"
-    if not question.strip():
-        return "Error: Question is required"
-    try:
-        if not high_performance_system.index:
-            doc_result = high_performance_system.process_document_optimized(document_url)
-            if not doc_result.get('success'):
-                return f"Error: Document processing failed - {doc_result.get('error')}"
-        result = high_performance_system.process_single_query_optimized(question)
-        response = f"""Answer: {result['answer']}
-Quality Metrics:
-- Confidence Score: {result['confidence']:.3f}
-- Processing Time: {result['processing_time']:.2f}s
-- Token Usage: {result['token_count']} tokens
-- Source Chunks: {result['source_chunks']}
-Reasoning: {result['reasoning']}"""
-        return response
-    except Exception as e:
-        return f"Error: {str(e)}"
-# Gradio Interface
 with gr.Blocks(
-    title="🚀 High-Performance Document QA System",
-    theme=gr.themes.Soft(),
     css="""
-    .gradio-container {
-        max-width: 1200px !important;
-    }
-    .performance-highlight {
-        background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
-        color: white;
-        padding: 20px;
-        border-radius: 10px;
-        margin: 10px 0;
-    }
     """
 ) as demo:
-    gr.HTML("""
-    <div class="performance-highlight">
-        <h1>🚀 High-Performance Document QA System</h1>
-        <p><strong>Powered by Qwen2.5-3B-Instruct + MPNet Embeddings + RAG Pipeline</strong></p>
-        <p>Optimized for insurance, legal, HR, and compliance documents with 90-95% accuracy</p>
-    </div>
-    """)
-    with gr.Tab("🎯 Hackathon Submission"):
-        gr.Markdown("### Production-Ready Processing with State-of-the-Art Models")
-        gr.Markdown("**Current Models**: Qwen2.5-3B-Instruct (QA, unquantized) + all-mpnet-base-v2 (Embeddings)")
-        with gr.Row():
-            with gr.Column():
-                hack_url = gr.Textbox(
-                    label="📄 Document URL (PDF/DOCX)",
-                    placeholder="https://hackrx.blob.core.windows.net/assets/policy.pdf?...",
-                    lines=2
-                )
-                hack_questions = gr.Textbox(
-                    label="❓ Questions (JSON array or line-separated)",
-                    placeholder='["What is the grace period?", "What is the waiting period for PED?"]',
-                    lines=12
-                )
-                hack_submit = gr.Button("🚀 Process with High-Performance System", variant="primary", size="lg")
-            with gr.Column():
-                hack_output = gr.Textbox(
-                    label="📊 High-Performance JSON Response",
-                    lines=20,
-                    max_lines=30
-                )
-    with gr.Tab("🔍 Single Query Analysis"):
-        gr.Markdown("### Detailed Single Query Processing with Performance Metrics")
-        with gr.Row():
-            with gr.Column():
-                single_url = gr.Textbox(
-                    label="📄 Document URL",
-                    placeholder="https://example.com/document.pdf",
-                    lines=1
-                )
-                single_question = gr.Textbox(
-                    label="❓ Question",
-                    placeholder="What is the grace period for premium payment?",
-                    lines=3
-                )
-                single_button = gr.Button("🔍 Get Detailed Answer", variant="secondary", size="lg")
-            with gr.Column():
-                single_output = gr.Textbox(
-                    label="📋 Detailed Response with Metrics",
-                    lines=20,
-                    max_lines=30
-                )
-    hack_submit.click(
-        process_hackathon_submission,
         inputs=[hack_url, hack_questions],
-        outputs=[hack_output]
     )
-    single_button.click(
-        process_single_question,
         inputs=[single_url, single_question],
-        outputs=[single_output]
     )
-# Mount the app
 app = gr.mount_gradio_app(api_app, demo, path="/")
 if __name__ == "__main__":
-    logger.info("Starting High-Performance Document QA System...")
-    logger.info("Models: Qwen2.5-3B-Instruct (QA, unquantized) + all-mpnet-base-v2 (Embeddings)")
-    logger.info("Optimized for insurance, legal, HR, and compliance documents")
-    # THE CORRECTED CODE
-    uvicorn.run(app, host="0.0.0.0", port=7860, root_path="/")

 # Initialize the system
 high_performance_system = HighPerformanceSystem()
+def hackathon_wrapper(url, questions_text):
+    """Wrapper to show processing status for the hackathon tab."""
+    # Show status message
+    yield gr.Markdown("⏳ Processing... Please wait.", visible=True)
+    # Call the original function
+    result = process_hackathon_submission(url, questions_text)
+    # Hide status message and return the final result
+    yield gr.Markdown(visible=False), result
+def single_query_wrapper(url, question):
+    """Wrapper to show processing status for the single query tab."""
+    # Show status message
+    yield gr.Markdown("⏳ Processing... Please wait.", visible=True)
+    # Call the original function
+    result = process_single_question(url, question)
+    # Hide status message and return the final result
+    yield gr.Markdown(visible=False), result
+# --- New and Immensely Improved Gradio Interface ---
 with gr.Blocks(
+    theme=gr.themes.Monochrome(
+        primary_hue="indigo",
+        secondary_hue="blue",
+        neutral_hue="slate",
+        font=[gr.themes.GoogleFont("Inter"), "ui-sans-serif", "system-ui", "sans-serif"],
+    ),
     css="""
+        /* --- Custom CSS for a Professional Look --- */
+        :root {
+            --primary-color: #4f46e5;
+            --secondary-color: #1e40af;
+            --background-color: #f8fafc;
+            --card-background-color: #ffffff;
+            --text-color: #334155;
+            --border-color: #e2e8f0;
+            --shadow: 0 4px 6px -1px rgba(0, 0, 0, 0.1), 0 2px 4px -2px rgba(0, 0, 0, 0.1);
+            --border-radius: 12px;
+        }
+        .gradio-container { background-color: var(--background-color); }
+        .app-header {
+            text-align: center;
+            padding: 2rem;
+            color: white;
+            background: linear-gradient(135deg, var(--primary-color) 0%, var(--secondary-color) 100%);
+            border-radius: var(--border-radius);
+            margin-bottom: 2rem;
+        }
+        .app-header h1 { font-size: 2.5rem; font-weight: 700; margin-bottom: 0.5rem; }
+        .app-header p { font-size: 1.1rem; opacity: 0.9; }
+        .status-text { padding: 1rem !important; background-color: #e0e7ff !important; color: var(--primary-color) !important; border-radius: var(--border-radius) !important; text-align: center; }
+        .gr-box { border: none !important; box-shadow: var(--shadow) !important; border-radius: var(--border-radius) !important; }
+        .gr-button { border-radius: 8px !important; }
     """
 ) as demo:
+    # --- Header ---
+    with gr.Row():
+        gr.HTML("""
+        <div class="app-header">
+            <h1>🚀 High-Performance Document QA System</h1>
+            <p><strong>Powered by Qwen2.5-3B-Instruct + MPNet Embeddings + RAG Pipeline</strong></p>
+            <p>Optimized for insurance, legal, HR, and compliance documents.</p>
+        </div>
+        """)
+    # --- Main Content Area ---
+    with gr.Row(variant="panel"):
+        # --- Left Column: Inputs ---
+        with gr.Column(scale=1):
+            with gr.Tabs():
+                # --- Hackathon Submission Tab ---
+                with gr.Tab("🎯 Hackathon Submission", id=0):
+                    with gr.Box():
+                        gr.Markdown("### 1. Provide Document and Questions")
+                        hack_url = gr.Textbox(
+                            label="📄 Document URL (PDF/DOCX)",
+                            placeholder="Enter the public URL of the document...",
+                            lines=2
+                        )
+                        hack_questions = gr.Textbox(
+                            label="❓ Questions (JSON array or one per line)",
+                            placeholder='["What is the grace period?", "Is maternity covered?"]',
+                            lines=8
+                        )
+                        gr.Examples(
+                            examples=[
+                                [
+                                    "https://hackrx.blob.core.windows.net/assets/policy.pdf?sp=r&st=2024-07-28T17:58:36Z&se=2024-08-05T01:58:36Z&spr=https&sv=2022-11-02&sr=b&sig=P3mH1m6xY95UPp5qT24l6j2l9V82p8vGEx2tTQP4fF0%3D",
+                                    '["What is the grace period for premium payment?","What is the waiting period for Pre-existing Diseases?","is maternity covered in this policy?"]'
+                                ]
+                            ],
+                            inputs=[hack_url, hack_questions]
+                        )
+                        with gr.Row():
+                            hack_clear_btn = gr.Button("Clear", variant="secondary")
+                            hack_submit_btn = gr.Button("🚀 Process Submission", variant="primary")
+                        hack_status = gr.Markdown(visible=False, elem_classes="status-text")
+                # --- Single Query Analysis Tab ---
+                with gr.Tab("🔍 Single Query Analysis", id=1):
+                    with gr.Box():
+                        gr.Markdown("### 1. Provide Document and a Question")
+                        single_url = gr.Textbox(
+                            label="📄 Document URL",
+                            placeholder="Enter the public URL of the document...",
+                            lines=2
+                        )
+                        single_question = gr.Textbox(
+                            label="❓ Your Question",
+                            placeholder="What is the waiting period for cataract surgery?",
+                            lines=5
+                        )
+                        with gr.Row():
+                            single_clear_btn = gr.Button("Clear", variant="secondary")
+                            single_submit_btn = gr.Button("🔍 Get Detailed Answer", variant="primary")
+                        single_status = gr.Markdown(visible=False, elem_classes="status-text")
+        # --- Right Column: Outputs ---
+        with gr.Column(scale=2):
+            with gr.Tabs():
+                with gr.Tab("✅ Results", id=2):
+                    with gr.Box():
+                        gr.Markdown("### 2. View the Results")
+                        hack_output = gr.Textbox(
+                            label="📊 Hackathon JSON Response",
+                            lines=20,
+                            max_lines=30,
+                            interactive=False
+                        )
+                        single_output = gr.Textbox(
+                            label="📋 Detailed Single Query Response",
+                            lines=20,
+                            max_lines=30,
+                            interactive=False
+                        )
+    # --- Event Handlers ---
+    # Hackathon Tab Logic
+    hack_submit_btn.click(
+        fn=hackathon_wrapper,
         inputs=[hack_url, hack_questions],
+        outputs=[hack_status, hack_output],
+        # Hide the other output box
+        js="""
+        () => {
+            const singleQueryTab = document.getElementById('tab_single_query_output');
+            if (singleQueryTab) {
+                singleQueryTab.style.display = 'none';
+            }
+            const hackathonTab = document.getElementById('tab_hackathon_output');
+            if (hackathonTab) {
+                hackathonTab.style.display = 'block';
+            }
+        }
+        """
     )
+    hack_clear_btn.click(lambda: (None, None, None, gr.Markdown(visible=False)), outputs=[hack_url, hack_questions, hack_output, hack_status])
+    # Single Query Tab Logic
+    single_submit_btn.click(
+        fn=single_query_wrapper,
         inputs=[single_url, single_question],
+        outputs=[single_status, single_output],
+        # Hide the other output box
+        js="""
+        () => {
+            const hackathonTab = document.getElementById('tab_hackathon_output');
+            if (hackathonTab) {
+                hackathonTab.style.display = 'none';
+            }
+            const singleQueryTab = document.getElementById('tab_single_query_output');
+            if (singleQueryTab) {
+                singleQueryTab.style.display = 'block';
+            }
+        }
+        """
     )
+    single_clear_btn.click(lambda: (None, None, None, gr.Markdown(visible=False)), outputs=[single_url, single_question, single_output, single_status])
+    # Logic to only show one output at a time based on which button was last clicked
+    # This requires giving the output Textbox components an `elem_id` to be targeted by JS
+    hack_output.elem_id = "tab_hackathon_output"
+    single_output.elem_id = "tab_single_query_output"
+# Mount the Gradio UI (`demo`) at the root path of `api_app` (presumably the
+# FastAPI app defined earlier in app.py -- confirm).
 app = gr.mount_gradio_app(api_app, demo, path="/")
 if __name__ == "__main__":
+    # Serve the single combined `app` with uvicorn on all interfaces, port 7860,
+    # so the API endpoints and the Gradio frontend share one server and one
+    # public port.
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=7860)