Spaces:

ChAbhishek28
/

PensionBot

Runtime error

App Files Community

ChAbhishek28 committed on Oct 10, 2025

Commit

a1986d7

1 Parent(s): 548a99d

Improve response formatting for better readability with proper spacing and bullet points

Browse files

Files changed (1) hide show

groq_websocket_handler.py +60 -52

groq_websocket_handler.py CHANGED Viewed

@@ -10,6 +10,7 @@ import asyncio
 import tempfile
 import os
 import time
 from typing import Dict, Any, Optional
 from pathlib import Path
 import uuid
@@ -798,63 +799,70 @@ class GroqWebSocketHandler:
             return response_text[:200] + "..." if len(response_text) > 200 else response_text
     def _apply_rajasthan_formatting(self, query: str, response_text: str) -> str:
-        """Apply Rajasthan government-specific formatting to responses"""
         try:
-            # Detect query language to avoid unnecessary Hindi formatting
-            query_language = self.hybrid_llm.detect_language(query)
-            query_lower = query.lower()
-            # For English queries, apply minimal formatting
-            if query_language == "english":
-                # Just highlight important terms in English only
-                highlighted = self.rajasthan_formatter.highlight_important_terms(response_text, language="english")
-                return highlighted
-            # Check if it's a procedure-related query
-            if any(keyword in query_lower for keyword in ['procedure', 'process', 'steps', 'how to', 'apply', 'प्रक्रिया', 'कैसे']):
-                # Extract procedure information from response
-                procedure_info = {
-                    'name': self._extract_procedure_name(query, response_text),
-                    'steps': self._extract_steps(response_text),
-                    'eligibility': self._extract_eligibility(response_text),
-                    'fees': self._extract_fees(response_text),
-                    'processing_time': self._extract_processing_time(response_text),
-                    'office': self._extract_office_info(response_text)
-                }
-                # Apply procedure formatting if we have enough info
-                if len(procedure_info['steps']) > 0:
-                    formatted = self.rajasthan_formatter.format_procedure_response(procedure_info)
-                    return self.rajasthan_formatter.add_rajasthan_context(formatted)
-            # Check if it's a circular/policy query
-            elif any(keyword in query_lower for keyword in ['circular', 'policy', 'rule', 'परिपत्र', 'नीति', 'नियम']):
-                # Extract circular information
-                circular_info = {
-                    'department': self._detect_department(response_text),
-                    'subject': query,
-                    'date': time.strftime('%d/%m/%Y'),
-                    'circular_no': self._extract_circular_number(response_text)
-                }
-                formatted = self.rajasthan_formatter.format_circular_response(response_text, circular_info)
-                return self.rajasthan_formatter.add_rajasthan_context(formatted)
-            # For calculation queries, format calculation steps
-            elif any(keyword in query_lower for keyword in ['calculate', 'calculation', 'amount', 'गणना', 'राशि']):
-                formatted = self.rajasthan_formatter.format_calculation_steps(response_text)
-                return self.rajasthan_formatter.add_rajasthan_context(formatted)
-            # General formatting for all responses
-            else:
-                # Apply highlighting and context
-                highlighted = self.rajasthan_formatter.highlight_important_terms(response_text)
-                return self.rajasthan_formatter.add_rajasthan_context(highlighted)
         except Exception as e:
             logger.error(f"❌ Error applying Rajasthan formatting: {e}")
             # Fallback to basic context addition
-            return self.rajasthan_formatter.add_rajasthan_context(response_text)
     def _extract_procedure_name(self, query: str, response: str) -> str:
         """Extract procedure name from query or response"""

 import tempfile
 import os
 import time
+import re
 from typing import Dict, Any, Optional
 from pathlib import Path
 import uuid
             return response_text[:200] + "..." if len(response_text) > 200 else response_text
     def _apply_rajasthan_formatting(self, query: str, response_text: str) -> str:
+        """Apply clean, readable Rajasthan government-specific formatting to responses"""
         try:
+            # Simple, readable formatting approach
+            return self._format_for_readability(response_text)
         except Exception as e:
             logger.error(f"❌ Error applying Rajasthan formatting: {e}")
             # Fallback to basic context addition
+            return response_text
+    def _format_for_readability(self, text: str) -> str:
+        """Format text for better readability with proper spacing and structure"""
+        try:
+            # Clean up the text first
+            text = text.strip()
+            # Split into sentences and clean up
+            sentences = text.split('. ')
+            formatted_sentences = []
+            current_section = ""
+            for sentence in sentences:
+                sentence = sentence.strip()
+                if not sentence:
+                    continue
+                # Add period if missing
+                if not sentence.endswith(('.', '!', '?', ':', '।')):
+                    sentence += '.'
+                # Check if this looks like a section header or important point
+                if any(marker in sentence.lower() for marker in [
+                    'eligibility criteria', 'minimum service', 'voluntary retirement',
+                    'family pension', 'gratuity', 'commutation', 'basic pay',
+                    'service pension', 'medical benefits', 'pension limitations'
+                ]):
+                    # This is an important point - format as bullet
+                    formatted_sentences.append(f"\n• **{sentence}**")
+                elif sentence.startswith(('The ', 'This ', 'It ', 'These ', 'Those ')):
+                    # Main explanation sentence
+                    formatted_sentences.append(f"\n{sentence}")
+                elif any(char.isdigit() for char in sentence[:10]):
+                    # Might contain numbers/dates - format as bullet
+                    formatted_sentences.append(f"\n• {sentence}")
+                else:
+                    # Regular sentence
+                    formatted_sentences.append(sentence)
+            # Join all sentences
+            formatted_text = ' '.join(formatted_sentences)
+            # Add proper spacing after bullets and sections
+            formatted_text = re.sub(r'\n•', '\n\n•', formatted_text)
+            formatted_text = re.sub(r'\*\*([^*]+)\*\*', r'**\1**\n', formatted_text)
+            # Clean up multiple newlines
+            formatted_text = re.sub(r'\n{3,}', '\n\n', formatted_text)
+            return formatted_text.strip()
+        except Exception as e:
+            logger.error(f"❌ Error in readability formatting: {e}")
+            return text
     def _extract_procedure_name(self, query: str, response: str) -> str:
         """Extract procedure name from query or response"""