Spaces:

ChAbhishek28
/

PensionBot

Runtime error

App Files Files Community

ChAbhishek28 committed on Oct 3, 2025

Commit

4a1bc78

1 Parent(s): 9341027

Add 89999999999999999999999999

Browse files

Files changed (2) hide show

enhanced_websocket_handler.py +77 -9
rag_service.py +271 -30

enhanced_websocket_handler.py CHANGED Viewed

@@ -27,15 +27,48 @@ hybrid_llm_service = HybridLLMService()
 logger = logging.getLogger("voicebot")
 def analyze_query_context(query: str) -> dict:
-    """Analyze query to determine if it's document-related or general"""
     query_lower = query.lower()
-    # Government document keywords
     doc_keywords = [
         'pension', 'leave', 'allowance', 'da', 'dearness', 'procurement', 'tender',
         'medical', 'reimbursement', 'transfer', 'posting', 'promotion', 'service',
         'rules', 'policy', 'government', 'circular', 'notification', 'benefits',
-        'gratuity', 'provident fund', 'retirement', 'salary', 'pay commission'
     ]
     # General conversation keywords
@@ -45,14 +78,26 @@ def analyze_query_context(query: str) -> dict:
         'time', 'date', 'joke', 'story', 'song', 'recipe', 'movie'
     ]
-    # Count matches
     doc_matches = sum(1 for kw in doc_keywords if kw in query_lower)
     general_matches = sum(1 for kw in general_keywords if kw in query_lower)
     # Determine query type
-    if doc_matches > 0:
         query_type = "document_related"
-        confidence = min(doc_matches * 0.3, 1.0)
     elif general_matches > 0:
         query_type = "general_conversation"
         confidence = min(general_matches * 0.4, 1.0)
@@ -67,7 +112,9 @@ def analyze_query_context(query: str) -> dict:
         "type": query_type,
         "confidence": confidence,
         "doc_keywords_found": doc_matches,
-        "general_keywords_found": general_matches
     }
 async def generate_llm_fallback_response(user_message: str, query_context: dict) -> str:
@@ -76,12 +123,33 @@ async def generate_llm_fallback_response(user_message: str, query_context: dict)
         # Determine which LLM to use based on query complexity
         provider = hybrid_llm_service.choose_llm_provider(user_message)
-        # Create appropriate system prompt based on query type
         if query_context.get("type") == "general_conversation":
             system_prompt = """You are a helpful assistant for a government document system.
             The user is asking a general question not related to government documents.
             Provide a friendly, helpful response and gently guide them to ask about government policies,
-            pension rules, leave policies, or other administrative matters if they need official information."""
         else:
             system_prompt = """You are an AI assistant for government document queries.
             The user asked about something that wasn't found in the document database.

 logger = logging.getLogger("voicebot")
 def analyze_query_context(query: str) -> dict:
+    """Analyze query to determine if it's document-related or general, and identify user role"""
     query_lower = query.lower()
+    # Role-specific keywords and queries
+    role_patterns = {
+        'pension_beneficiary': [
+            'pension eligibility', 'pension documents', 'pension application', 'retirement benefits',
+            'pension calculation', 'pension amount', 'family pension', 'commutation',
+            'gratuity eligibility', 'provident fund withdrawal', 'medical benefits after retirement',
+            'pension certificate', 'life certificate', 'pension arrears', 'how to apply pension',
+            'pension office', 'pension disbursement', 'pension inquiry', 'pension status'
+        ],
+        'procurement_officer': [
+            'tender process', 'bid submission', 'procurement thresholds', 'gem portal',
+            'msme relaxation', 'vendor registration', 'procurement checklist', 'bid evaluation',
+            'tender documents', 'procurement rules', 'bidding process', 'contract award',
+            'procurement guidelines', 'tender notice', 'technical bid', 'financial bid',
+            'procurement manual', 'vendor empanelment', 'tender committee'
+        ],
+        'finance_staff': [
+            'sanctioning authority', 'financial approval', 'budget allocation', 'expenditure sanction',
+            'financial registers', 'audit compliance', 'treasury rules', 'payment authorization',
+            'financial delegation', 'budget utilization', 'fund release', 'financial procedure',
+            'accounting rules', 'financial reporting', 'expenditure control', 'financial audit',
+            'cash book', 'voucher processing', 'financial clearance'
+        ],
+        'leadership_policymaker': [
+            'policy impact', 'scenario analysis', 'cost comparison', 'policy implementation',
+            'evidence pack', 'policy evaluation', 'impact assessment', 'strategic planning',
+            'policy formulation', 'comparative analysis', 'policy review', 'governance framework',
+            'administrative reform', 'policy effectiveness', 'decision support', 'policy brief'
+        ]
+    }
+    # Government document keywords (expanded)
     doc_keywords = [
         'pension', 'leave', 'allowance', 'da', 'dearness', 'procurement', 'tender',
         'medical', 'reimbursement', 'transfer', 'posting', 'promotion', 'service',
         'rules', 'policy', 'government', 'circular', 'notification', 'benefits',
+        'gratuity', 'provident fund', 'retirement', 'salary', 'pay commission',
+        'eligibility', 'documents', 'application', 'process', 'approval', 'sanction',
+        'audit', 'finance', 'budget', 'expenditure', 'treasury', 'guidelines'
     ]
     # General conversation keywords
         'time', 'date', 'joke', 'story', 'song', 'recipe', 'movie'
     ]
+    # Detect user role
+    detected_role = None
+    role_confidence = 0.0
+    for role, patterns in role_patterns.items():
+        role_matches = sum(1 for pattern in patterns if pattern in query_lower)
+        if role_matches > 0:
+            current_confidence = min(role_matches * 0.4, 1.0)
+            if current_confidence > role_confidence:
+                detected_role = role
+                role_confidence = current_confidence
+    # Count general matches
     doc_matches = sum(1 for kw in doc_keywords if kw in query_lower)
     general_matches = sum(1 for kw in general_keywords if kw in query_lower)
     # Determine query type
+    if doc_matches > 0 or detected_role:
         query_type = "document_related"
+        confidence = max(min(doc_matches * 0.3, 1.0), role_confidence)
     elif general_matches > 0:
         query_type = "general_conversation"
         confidence = min(general_matches * 0.4, 1.0)
         "type": query_type,
         "confidence": confidence,
         "doc_keywords_found": doc_matches,
+        "general_keywords_found": general_matches,
+        "detected_role": detected_role,
+        "role_confidence": role_confidence
     }
 async def generate_llm_fallback_response(user_message: str, query_context: dict) -> str:
         # Determine which LLM to use based on query complexity
         provider = hybrid_llm_service.choose_llm_provider(user_message)
+        # Create role-aware system prompt
+        detected_role = query_context.get("detected_role")
         if query_context.get("type") == "general_conversation":
             system_prompt = """You are a helpful assistant for a government document system.
             The user is asking a general question not related to government documents.
             Provide a friendly, helpful response and gently guide them to ask about government policies,
+            pension rules, leave policies, procurement procedures, or other administrative matters if they need official information."""
+        elif detected_role == "pension_beneficiary":
+            system_prompt = """You are an AI assistant specializing in government pension and retirement benefits.
+            The user appears to be a pension beneficiary or claimant. Provide helpful information about pension eligibility,
+            application processes, required documents, and procedures. Always remind them to verify information with
+            the pension disbursing authority and consult official government sources for the most current rules."""
+        elif detected_role == "procurement_officer":
+            system_prompt = """You are an AI assistant specializing in government procurement procedures.
+            The user appears to be involved in procurement or bidding processes. Provide helpful information about
+            tender procedures, MSME benefits, GeM portal usage, and procurement guidelines. Always remind them to
+            follow current procurement rules and consult the latest government circulars."""
+        elif detected_role == "finance_staff":
+            system_prompt = """You are an AI assistant specializing in government financial procedures.
+            The user appears to be finance staff. Provide helpful information about sanctioning procedures,
+            budget management, audit compliance, and treasury rules. Always remind them to follow current
+            financial rules and consult with the accounts department for official procedures."""
+        elif detected_role == "leadership_policymaker":
+            system_prompt = """You are an AI assistant specializing in policy analysis and decision support.
+            The user appears to be in a leadership or policy-making role. Provide helpful information about
+            policy impact analysis, evidence-based decision making, and strategic planning. Always recommend
+            consulting with relevant departments and conducting proper stakeholder consultations."""
         else:
             system_prompt = """You are an AI assistant for government document queries.
             The user asked about something that wasn't found in the document database.

rag_service.py CHANGED Viewed

@@ -11,6 +11,149 @@ import asyncio
 logger = logging.getLogger("voicebot")
 # Fallback content for when database is empty
 FALLBACK_CONTENT = {
     "pension": """Pension is a regular payment made during a person's retirement from an investment fund. For government employees in India, pension includes:
@@ -47,7 +190,42 @@ DA 6% Increment Impact:
    - Monthly credit via NEFT
 3. Benefits include pension, gratuity, and provident fund
-4. Enhanced benefits for teachers and staff"""
 }
 def get_fallback_content(query: str) -> List[Dict[str, Any]]:
@@ -129,6 +307,22 @@ def get_fallback_content(query: str) -> List[Dict[str, Any]]:
                 "Obtain necessary approvals",
                 "Maintain leave records"
             ]
         else:
             fallback_text = f"I understand you're asking about '{query}'. While I don't have specific documents loaded for this query, I can help with government policies, pension rules, allowances, and administrative procedures. Please try rephrasing your question or ask about specific government benefits."
             checklist = [
@@ -199,8 +393,40 @@ async def search_documents_async(query: str, limit: int = 5) -> List[Dict[str, A
         # Enhance query for better relevance based on category
         enhanced_query = query
-        # Pension queries
-        if "pension" in query_lower:
             if any(word in query_lower for word in ["changes", "impact", "rules"]):
                 enhanced_query = f"{query} pension rules retirement benefits modifications"
             elif "calculation" in query_lower or "formula" in query_lower:
@@ -225,6 +451,18 @@ async def search_documents_async(query: str, limit: int = 5) -> List[Dict[str, A
         # Transfer queries
         elif any(word in query_lower for word in ["transfer", "posting"]):
             enhanced_query = f"{query} transfer posting policy rules"
         logger.info(f"🔍 Enhanced query: '{enhanced_query}' (original: '{query}')")
@@ -265,8 +503,19 @@ async def search_documents_async(query: str, limit: int = 5) -> List[Dict[str, A
             # Calculate relevance score based on query intent
             relevance_score = getattr(doc, 'score', 0.5)  # Base score
-            # Define query categories and their keywords
             query_categories = {
                 'pension': ['pension', 'retirement', 'gratuity', 'provident fund', 'gpf', 'cpf', 'superannuation'],
                 'leave': ['leave', 'casual leave', 'earned leave', 'medical leave', 'maternity', 'paternity'],
                 'allowance': ['allowance', 'dearness allowance', 'da', 'hra', 'house rent', 'travel allowance', 'increment'],
@@ -274,11 +523,22 @@ async def search_documents_async(query: str, limit: int = 5) -> List[Dict[str, A
                 'medical': ['medical', 'health', 'treatment', 'reimbursement', 'cghs', 'hospital'],
                 'transfer': ['transfer', 'posting', 'deputation', 'cadre'],
                 'promotion': ['promotion', 'seniority', 'grade', 'advancement', 'career progression'],
-                'service': ['service', 'conduct', 'discipline', 'rules', 'regulation']
             }
-            # Content categories - what each document type contains
             content_categories = {
                 'pension': ['pension', 'retirement', 'gratuity', 'provident fund', 'superannuation', 'benefits'],
                 'leave': ['leave', 'casual', 'earned', 'medical leave', 'maternity'],
                 'allowance': ['allowance', 'dearness', 'house rent', 'travel', 'da', 'hra', 'increment'],
@@ -286,6 +546,9 @@ async def search_documents_async(query: str, limit: int = 5) -> List[Dict[str, A
                 'medical': ['medical', 'health', 'cghs', 'reimbursement', 'treatment'],
                 'transfer': ['transfer', 'posting', 'deputation', 'cadre'],
                 'promotion': ['promotion', 'seniority', 'grade pay', 'advancement'],
                 'service': ['service rules', 'conduct', 'discipline', 'misconduct']
             }
@@ -334,30 +597,8 @@ async def search_documents_async(query: str, limit: int = 5) -> List[Dict[str, A
             clause_text = doc.page_content
             # Simple extractive summary: first sentence or up to 2 lines
             summary = clause_text.split(". ")[0][:180] + ("..." if len(clause_text) > 180 else "")
-            # Role-aware checklist logic (basic template)
-            role_checklist = []
-            query_lower = query.lower()
-            if "pension" in query_lower:
-                role_checklist = [
-                    "Check eligibility (service years, misconduct)",
-                    "Collect required documents (service book, ID, proof)",
-                    "Obtain approvals (sanctioning authority)",
-                    "Submit application to pension office"
-                ]
-            elif "procurement" in query_lower or "bid" in query_lower:
-                role_checklist = [
-                    "Review procurement thresholds and MSME relaxations",
-                    "Prepare bid documents",
-                    "Complete registration and approvals",
-                    "Submit bid before deadline"
-                ]
-            elif "finance" in query_lower:
-                role_checklist = [
-                    "Check sanctioning steps",
-                    "Update registers",
-                    "Obtain necessary approvals",
-                    "Notify stakeholders"
-                ]
             results.append({
                 "clause_text": clause_text,
                 "summary": summary,

 logger = logging.getLogger("voicebot")
# Ordered (trigger phrases, checklist) rules. Order matters: the first rule
# with any phrase occurring as a substring of the lower-cased query wins, so
# the specific role-oriented rules come before the broad single-keyword ones.
_ROLE_CHECKLIST_RULES = (
    # Pension Beneficiaries & Claimants
    (
        ('pension eligibility', 'pension documents', 'how to apply pension', 'pension application'),
        (
            "Verify service eligibility (minimum 10 years qualifying service)",
            "Gather required documents (service book, PPO, identity proof)",
            "Check for any departmental proceedings or vigilance cases",
            "Apply through proper channel 6 months before retirement",
            "Follow up with pension disbursing authority for processing",
        ),
    ),
    (
        ('family pension', 'widow pension', 'dependent pension'),
        (
            "Obtain death certificate and service documents of deceased employee",
            "Submit family pension application with nominee details",
            "Provide proof of relationship and dependency",
            "Get certificate from employer about last drawn salary",
            "Register with pension disbursing bank for regular payments",
        ),
    ),
    (
        ('pension calculation', 'pension amount'),
        (
            "Collect last pay certificate with basic pay and DA details",
            "Calculate qualifying service excluding breaks/suspensions",
            "Apply pension formula: (Last pay × service years) ÷ 70",
            "Check for minimum pension ceiling and DA applicability",
            "Verify commutation options if considering lump sum",
        ),
    ),
    # Procurement Officers & Bidders
    (
        ('tender process', 'bid submission', 'procurement threshold'),
        (
            "Verify procurement threshold limits and delegation of powers",
            "Check MSME purchase preference and price benefits applicable",
            "Ensure technical specifications are non-discriminatory",
            "Follow mandatory e-procurement process through GeM/portal",
            "Maintain proper documentation for audit trail",
        ),
    ),
    (
        ('msme relaxation', 'msme benefits'),
        (
            "Verify MSME registration certificate validity",
            "Apply 15% price preference for MSME quotes",
            "Check exemption from EMD (Earnest Money Deposit)",
            "Ensure MSME gets advance payment facility if applicable",
            "Follow tender splitting norms for MSME participation",
        ),
    ),
    (
        ('gem portal', 'vendor registration'),
        (
            "Complete vendor registration on Government e-Marketplace",
            "Upload all required business documents and certificates",
            "Get product/service catalog approved by GeM",
            "Maintain competitive pricing and service ratings",
            "Respond promptly to buyer inquiries and orders",
        ),
    ),
    # Finance Staff
    (
        ('sanctioning authority', 'financial approval', 'expenditure sanction'),
        (
            "Verify delegated financial powers and approval limits",
            "Check budget provision and availability of funds",
            "Ensure compliance with financial rules and procedures",
            "Obtain necessary pre-audit clearance if required",
            "Maintain proper accounting and audit trail",
        ),
    ),
    (
        ('budget allocation', 'fund release'),
        (
            "Verify budget allocation in approved estimates",
            "Check fund availability in treasury/bank account",
            "Ensure proper budget head classification",
            "Follow fund release schedule and priority guidelines",
            "Update budget utilization registers promptly",
        ),
    ),
    (
        ('audit compliance', 'financial audit'),
        (
            "Maintain all vouchers and supporting documents",
            "Ensure transactions are recorded in proper registers",
            "Respond to audit queries within stipulated time",
            "Implement audit recommendations and report compliance",
            "Conduct internal audit and review before external audit",
        ),
    ),
    # Leadership & Policymakers
    (
        ('policy impact', 'scenario analysis'),
        (
            "Gather baseline data and impact measurement parameters",
            "Conduct stakeholder consultation and feedback analysis",
            "Prepare cost-benefit analysis for different scenarios",
            "Assess implementation feasibility and resource requirements",
            "Develop monitoring and evaluation framework",
        ),
    ),
    (
        ('evidence pack', 'policy brief'),
        (
            "Compile relevant policy documents and legal framework",
            "Gather statistical data and trend analysis",
            "Include comparative analysis from other states/countries",
            "Prepare executive summary with key recommendations",
            "Ensure all sources are cited and verifiable",
        ),
    ),
    # General categories with enhanced checklists
    (
        ("pension",),
        (
            "Check eligibility criteria and service requirements",
            "Collect required documents (service book, PPO, ID proof)",
            "Obtain necessary approvals and clearances",
            "Submit application through proper channel",
            "Follow up with pension office for processing status",
        ),
    ),
    (
        ("procurement", "tender", "bid"),
        (
            "Review procurement guidelines and threshold limits",
            "Check MSME relaxations and price preferences",
            "Prepare comprehensive bid documents",
            "Ensure compliance with technical specifications",
            "Submit bid through approved e-procurement platform",
        ),
    ),
    (
        ("finance", "budget", "expenditure"),
        (
            "Verify financial delegation and approval limits",
            "Check budget provision and fund availability",
            "Ensure compliance with treasury and accounting rules",
            "Maintain proper documentation for audit",
            "Update financial registers and reports",
        ),
    ),
    (
        ("leave",),
        (
            "Check leave balance and entitlement",
            "Follow prescribed application procedure",
            "Obtain necessary approvals from competent authority",
            "Arrange work coverage during leave period",
            "Update attendance records upon return",
        ),
    ),
)

# Checklist returned when no rule in _ROLE_CHECKLIST_RULES matches the query.
_DEFAULT_CHECKLIST = (
    "Review relevant policy guidelines and procedures",
    "Consult with appropriate authorities if needed",
    "Ensure compliance with applicable rules",
    "Maintain proper documentation",
    "Seek clarification for any doubts",
)


def generate_role_based_checklist(query: str, content: str) -> list:
    """Return a five-step action checklist chosen from the wording of *query*.

    The query is lower-cased and tested, in order, against the trigger
    phrases in ``_ROLE_CHECKLIST_RULES`` using plain substring matching; the
    checklist of the first matching rule is returned. If nothing matches,
    a generic checklist is returned.

    Args:
        query: The user's question. ``None`` or an empty string is treated
            as "no keywords" and yields the generic checklist.
        content: Text of the matched document clause. Accepted for interface
            compatibility; the selection logic does not consult it.

    Returns:
        A new list of checklist strings on every call, so callers may
        mutate the result freely.
    """
    # Tolerate a missing query instead of raising AttributeError on None.
    query_lower = (query or "").lower()

    for phrases, checklist in _ROLE_CHECKLIST_RULES:
        if any(phrase in query_lower for phrase in phrases):
            # Copy: the rule table is shared module state.
            return list(checklist)

    return list(_DEFAULT_CHECKLIST)
 # Fallback content for when database is empty
 FALLBACK_CONTENT = {
     "pension": """Pension is a regular payment made during a person's retirement from an investment fund. For government employees in India, pension includes:
    - Monthly credit via NEFT
 3. Benefits include pension, gratuity, and provident fund
+4. Enhanced benefits for teachers and staff""",
+    "procurement": """Government Procurement Guidelines:
+1. Threshold Limits:
+   - Goods: ₹25,000 to ₹25 lakh (departmental purchase committee)
+   - Works: ₹1 lakh to ₹5 crore (various committees)
+   - Services: As per delegation of powers
+2. MSME Benefits:
+   - 15% price preference in competitive bids
+   - Exemption from EMD (Earnest Money Deposit)
+   - No tender fee for MSME enterprises
+   - Advance payment facility available
+3. GeM Portal Usage:
+   - Mandatory for central government purchases
+   - Direct purchase up to ₹5 lakh
+   - Rate contract for common items""",
+    "finance": """Financial Management Guidelines:
+1. Sanctioning Authority:
+   - As per delegation of financial powers
+   - Budget provision must be available
+   - Pre-audit clearance where required
+2. Documentation:
+   - All expenditure must have proper vouchers
+   - Budget registers to be maintained
+   - Audit trail for all transactions
+3. Treasury Rules:
+   - Follow prescribed payment procedures
+   - Maintain cash book and other registers
+   - Submit periodic returns and statements"""
 }
 def get_fallback_content(query: str) -> List[Dict[str, Any]]:
                 "Obtain necessary approvals",
                 "Maintain leave records"
             ]
+        elif any(word in query_lower for word in ["audit", "financial", "budget", "expenditure", "accounts"]):
+            fallback_text = f"Regarding your query about '{query}', government financial audits and accounts are typically maintained at departmental and central levels. Financial audits cover budget utilization, expenditure patterns, and compliance with financial rules. For specific audit reports, you would need to access official government finance portals or contact the concerned audit department."
+            checklist = [
+                "Contact Controller and Auditor General (CAG) office",
+                "Check government finance portals for audit reports",
+                "Request specific financial year audit documents",
+                "Verify with concerned department's accounts section"
+            ]
+        elif any(word in query_lower for word in ["training", "development", "skill", "course"]):
+            fallback_text = f"Regarding your query about '{query}', government training and development programs are designed to enhance employee capabilities. These include induction training, skill development courses, leadership programs, and specialized technical training through various government training institutes."
+            checklist = [
+                "Check available training programs in your department",
+                "Contact training institutes for course details",
+                "Apply for relevant skill development programs",
+                "Utilize online learning platforms like iGOT Karmayogi"
+            ]
         else:
             fallback_text = f"I understand you're asking about '{query}'. While I don't have specific documents loaded for this query, I can help with government policies, pension rules, allowances, and administrative procedures. Please try rephrasing your question or ask about specific government benefits."
             checklist = [
         # Enhance query for better relevance based on category
         enhanced_query = query
+        # Role-specific query enhancement
+        # Pension Beneficiary queries
+        if any(word in query_lower for word in ["pension eligibility", "pension documents", "how to apply pension", "pension certificate"]):
+            enhanced_query = f"{query} pension eligibility documents application process beneficiary requirements"
+        elif any(word in query_lower for word in ["family pension", "widow pension", "dependent pension"]):
+            enhanced_query = f"{query} family pension eligibility widow dependent benefits"
+        elif any(word in query_lower for word in ["pension calculation", "pension amount", "pension formula"]):
+            enhanced_query = f"{query} pension calculation formula amount computation service years"
+        # Procurement Officer queries
+        elif any(word in query_lower for word in ["tender process", "bid submission", "procurement threshold"]):
+            enhanced_query = f"{query} procurement tender bidding process thresholds guidelines"
+        elif any(word in query_lower for word in ["msme relaxation", "msme benefits", "small scale industry"]):
+            enhanced_query = f"{query} msme relaxation benefits procurement small scale industry"
+        elif any(word in query_lower for word in ["gem portal", "vendor registration", "vendor empanelment"]):
+            enhanced_query = f"{query} gem portal vendor registration empanelment process"
+        # Finance Staff queries
+        elif any(word in query_lower for word in ["sanctioning authority", "financial approval", "expenditure sanction"]):
+            enhanced_query = f"{query} sanctioning authority financial approval expenditure delegation"
+        elif any(word in query_lower for word in ["budget allocation", "fund release", "treasury"]):
+            enhanced_query = f"{query} budget allocation fund release treasury rules procedures"
+        elif any(word in query_lower for word in ["audit compliance", "financial audit", "audit report"]):
+            enhanced_query = f"{query} audit compliance financial audit reporting procedures"
+        # Leadership/Policymaker queries
+        elif any(word in query_lower for word in ["policy impact", "scenario analysis", "comparative analysis"]):
+            enhanced_query = f"{query} policy impact scenario analysis comparison evidence"
+        elif any(word in query_lower for word in ["evidence pack", "policy brief", "decision support"]):
+            enhanced_query = f"{query} evidence pack policy brief decision support documentation"
+        # General category queries
+        elif "pension" in query_lower:
             if any(word in query_lower for word in ["changes", "impact", "rules"]):
                 enhanced_query = f"{query} pension rules retirement benefits modifications"
             elif "calculation" in query_lower or "formula" in query_lower:
         # Transfer queries
         elif any(word in query_lower for word in ["transfer", "posting"]):
             enhanced_query = f"{query} transfer posting policy rules"
+        # Audit and financial queries
+        elif any(word in query_lower for word in ["audit", "financial", "budget", "expenditure", "accounts", "finance"]):
+            enhanced_query = f"{query} audit financial budget expenditure accounts"
+        # Training and development queries
+        elif any(word in query_lower for word in ["training", "development", "course", "skill"]):
+            enhanced_query = f"{query} training development skill course capacity building"
+        # Salary and pay queries
+        elif any(word in query_lower for word in ["salary", "pay", "grade", "scale"]):
+            enhanced_query = f"{query} salary pay grade scale compensation"
         logger.info(f"🔍 Enhanced query: '{enhanced_query}' (original: '{query}')")
             # Calculate relevance score based on query intent
             relevance_score = getattr(doc, 'score', 0.5)  # Base score
+            # Define query categories and their keywords (including role-specific)
             query_categories = {
+                'pension_beneficiary': ['pension eligibility', 'pension documents', 'pension application', 'pension certificate',
+                                      'family pension', 'pension calculation', 'how to apply pension', 'pension office',
+                                      'life certificate', 'pension arrears', 'commutation', 'gratuity eligibility'],
+                'procurement_officer': ['tender process', 'bid submission', 'procurement threshold', 'gem portal',
+                                      'msme relaxation', 'vendor registration', 'procurement checklist', 'bid evaluation',
+                                      'tender documents', 'bidding process', 'contract award', 'vendor empanelment'],
+                'finance_staff': ['sanctioning authority', 'financial approval', 'budget allocation', 'expenditure sanction',
+                                'financial registers', 'audit compliance', 'treasury rules', 'payment authorization',
+                                'financial delegation', 'fund release', 'financial procedure', 'voucher processing'],
+                'leadership_policymaker': ['policy impact', 'scenario analysis', 'evidence pack', 'policy brief',
+                                         'comparative analysis', 'decision support', 'policy evaluation', 'impact assessment'],
                 'pension': ['pension', 'retirement', 'gratuity', 'provident fund', 'gpf', 'cpf', 'superannuation'],
                 'leave': ['leave', 'casual leave', 'earned leave', 'medical leave', 'maternity', 'paternity'],
                 'allowance': ['allowance', 'dearness allowance', 'da', 'hra', 'house rent', 'travel allowance', 'increment'],
                 'medical': ['medical', 'health', 'treatment', 'reimbursement', 'cghs', 'hospital'],
                 'transfer': ['transfer', 'posting', 'deputation', 'cadre'],
                 'promotion': ['promotion', 'seniority', 'grade', 'advancement', 'career progression'],
+                'service': ['service', 'conduct', 'discipline', 'rules', 'regulation'],
+                'audit': ['audit', 'financial', 'budget', 'expenditure', 'accounts', 'finance', 'yearly', 'annual'],
+                'training': ['training', 'development', 'skill', 'course', 'capacity building', 'learning'],
+                'salary': ['salary', 'pay', 'grade', 'scale', 'compensation', 'structure']
             }
+            # Content categories - what each document type contains (including role-specific)
             content_categories = {
+                'pension_beneficiary': ['pension', 'retirement', 'eligibility', 'documents', 'application', 'certificate',
+                                      'family pension', 'gratuity', 'commutation', 'beneficiary', 'process', 'office'],
+                'procurement_officer': ['procurement', 'tender', 'bidding', 'contract', 'vendor', 'gem', 'msme',
+                                      'threshold', 'process', 'evaluation', 'registration', 'checklist', 'guidelines'],
+                'finance_staff': ['sanctioning', 'approval', 'budget', 'expenditure', 'treasury', 'audit',
+                                'financial', 'fund', 'payment', 'authorization', 'delegation', 'registers'],
+                'leadership_policymaker': ['policy', 'impact', 'scenario', 'analysis', 'evidence', 'comparative',
+                                         'evaluation', 'decision', 'strategic', 'implementation', 'assessment'],
                 'pension': ['pension', 'retirement', 'gratuity', 'provident fund', 'superannuation', 'benefits'],
                 'leave': ['leave', 'casual', 'earned', 'medical leave', 'maternity'],
                 'allowance': ['allowance', 'dearness', 'house rent', 'travel', 'da', 'hra', 'increment'],
                 'medical': ['medical', 'health', 'cghs', 'reimbursement', 'treatment'],
                 'transfer': ['transfer', 'posting', 'deputation', 'cadre'],
                 'promotion': ['promotion', 'seniority', 'grade pay', 'advancement'],
+                'audit': ['audit', 'financial', 'budget', 'expenditure', 'accounts', 'finance', 'yearly'],
+                'training': ['training', 'development', 'skill', 'course', 'capacity', 'learning'],
+                'salary': ['salary', 'pay', 'grade', 'scale', 'compensation', 'structure'],
                 'service': ['service rules', 'conduct', 'discipline', 'misconduct']
             }
             clause_text = doc.page_content
             # Simple extractive summary: first sentence or up to 2 lines
             summary = clause_text.split(". ")[0][:180] + ("..." if len(clause_text) > 180 else "")
+            # Enhanced role-aware checklist logic
+            role_checklist = generate_role_based_checklist(query, clause_text)
             results.append({
                 "clause_text": clause_text,
                 "summary": summary,