contract-risk-analyzer2

Sleeping

App Files Files Community

Kushalmanda committed on Jun 12, 2025

Commit

99543cd

verified ·

1 Parent(s): 5eac03e

Update app.py

Browse files

Files changed (1) hide show

app.py +259 -328

app.py CHANGED Viewed

@@ -9,10 +9,14 @@ from simple_salesforce import Salesforce
 import os
 import base64
 from io import BytesIO
-from datetime import datetime
-import pytz
-# Custom CSS for styling with full-page background image
 css = """
 body {
     background-image: url('https://images.unsplash.com/photo-1604147706283-d7119b5b822c?ixlib=rb-1.2.1&auto=format&fit=crop&w=1920&q=80');
@@ -20,248 +24,205 @@ body {
     background-position: center;
     background-attachment: fixed;
     background-repeat: no-repeat;
-    min-height: 100vh;  /* Ensures full height */
     margin: 0;
     padding: 0;
     font-family: Arial, sans-serif;
 }
 .gradio-container {
-    background-color: rgba(255, 255, 255, 0.9);
     border-radius: 10px;
     padding: 20px;
     margin: 20px;
-    max-width: 100%; /* Allow full width */
     box-shadow: 0 4px 12px rgba(0,0,0,0.15);
-    min-height: 90vh;  /* Make sure the container fills the screen */
 }
 .risk-low { color: #28a745; font-weight: bold; }
 .risk-medium { color: #ffc107; font-weight: bold; }
 .risk-high { color: #dc3545; font-weight: bold; }
-.result-box {
-    padding: 20px;
-    border-radius: 5px;
-    margin-bottom: 20px;
-    background-color: rgba(255, 255, 255, 0.8);
 }
-.penalty-box {
-    padding: 15px;
-    border-radius: 5px;
-    margin-bottom: 15px;
     border-left: 5px solid #dc3545;
-    background-color: rgba(255, 245, 245, 0.8);
 }
-.obligation-box {
-    padding: 15px;
-    border-radius: 5px;
-    margin-bottom: 15px;
     border-left: 5px solid #ffc107;
-    background-color: rgba(255, 249, 230, 0.8);
 }
-.delay-box {
-    padding: 15px;
-    border-radius: 5px;
-    margin-bottom: 15px;
     border-left: 5px solid #17a2b8;
-    background-color: rgba(230, 249, 255, 0.8);
 }
 .combined-risk-container {
     display: flex;
     flex-direction: column;
     gap: 10px;
     margin-bottom: 20px;
 }
 .risk-row {
     display: flex;
     align-items: center;
     gap: 15px;
     padding: 10px;
     border-radius: 5px;
-    background-color: rgba(248, 249, 250, 0.8);
 }
 .risk-label {
     width: 120px;
     font-weight: bold;
     font-size: 16px;
 }
 .risk-score {
     width: 100px;
     font-size: 18px;
     text-align: center;
 }
 .heatmap-wrapper {
     flex-grow: 1;
 }
 .warning-box {
     padding: 15px;
     border-radius: 5px;
     margin: 10px 0;
-    background-color: rgba(255, 243, 205, 0.8);
     border-left: 5px solid #ffc107;
     font-weight: bold;
 }
 .danger-box {
     padding: 15px;
     border-radius: 5px;
     margin: 10px 0;
-    background-color: rgba(248, 215, 218, 0.8);
     border-left: 5px solid #dc3545;
     font-weight: bold;
 }
 .success-box {
     padding: 15px;
     border-radius: 5px;
     margin: 10px 0;
-    background-color: rgba(212, 237, 218, 0.8);
     border-left: 5px solid #28a745;
     font-weight: bold;
 }
 .section-title {
     font-size: 20px;
     font-weight: bold;
     margin-bottom: 15px;
-    color: #333;
 }
 .count-item {
     display: flex;
     justify-content: space-between;
     padding: 10px 0;
-    border-bottom: 1px solid #eee;
 }
 .count-label {
     font-weight: bold;
 }
 .count-value {
-    color: #555;
 }
-.section-container {
-    margin-bottom: 25px;
-    padding: 15px;
-    border-radius: 5px;
-    background-color: rgba(248, 249, 250, 0.8);
 }
-.salesforce-success {
-    padding: 15px;
-    border-radius: 5px;
-    background-color: rgba(212, 237, 218, 0.8);
-    border-left: 5px solid #28a745;
-    margin-top: 20px;
-    font-weight: bold;
 }
-.salesforce-error {
-    padding: 15px;
-    border-radius: 5px;
-    background-color: rgba(248, 215, 218, 0.8);
-    border-left: 5px solid #dc3545;
-    margin-top: 20px;
-    font-weight: bold;
-}
-header {
-    background-color: rgba(13, 110, 253, 0.85);
-    color: white;
-    padding: 20px;
-    border-radius: 10px;
-    margin-bottom: 20px;
 }
-footer {
-    text-align: center;
-    margin-top: 30px;
-    padding: 15px;
-    background-color: rgba(0, 0, 0, 0.7);
-    color: white;
-    border-radius: 5px;
 }
-@media only screen and (max-width: 1200px) {
-    .gradio-container {
-        margin: 10px;
-    }
-    .risk-row {
-        flex-direction: column;
-        align-items: flex-start;
-    }
 }
 """
 # Salesforce credentials
-USERNAME = 'Kushalpavansekharm503@agentforce.com'
-PASSWORD = 'Kushal@123'
-SECURITY_TOKEN = 'WwUIFWBVUjeKn9VPKyWJmawY0'
def get_salesforce_connection():
    """Open a Salesforce session using the module-level credentials.

    Returns:
        The ``Salesforce`` client, or ``None`` when the client could not be
        created (the error is printed to stdout in that case).
    """
    try:
        client = Salesforce(
            username=USERNAME,
            password=PASSWORD,
            security_token=SECURITY_TOKEN,
        )
    except Exception as exc:
        # Best effort: report the problem and let the caller handle None.
        print(f"Salesforce connection error: {str(exc)}")
        return None
    return client
def create_salesforce_record(results: dict):
    """Store one analysis result as a ``Custom_Risk_Analysis__c`` record.

    Args:
        results: Analysis payload; the keys ``risk_score``, ``risk_level``,
            ``penalty_examples``, ``penalty_amounts``, ``penalty_details``,
            ``obligation_details`` and ``delay_details`` are read.

    Returns:
        ``(record_id, None)`` when Salesforce reports success, otherwise
        ``(None, error_message)``. No exception escapes this function.
    """
    # (Salesforce field, key in ``results``, maximum stored length)
    truncated_fields = (
        ('Penalty_Examples__c', 'penalty_examples', 32768),
        ('Penalty_Amounts__c', 'penalty_amounts', 255),
        ('Penalty_Details__c', 'penalty_details', 32768),
        ('Obligation_Details__c', 'obligation_details', 32768),
        ('Delay_Details__c', 'delay_details', 32768),
    )
    try:
        connection = get_salesforce_connection()
        if not connection:
            return None, "Failed to connect to Salesforce"

        # 'CreatedDate' is deliberately absent: Salesforce manages it itself.
        payload = {
            'Risk_Score__c': results['risk_score'],
            'Risk_Level__c': results['risk_level'],
        }
        for field_name, key, limit in truncated_fields:
            payload[field_name] = results[key][:limit]

        outcome = connection.Custom_Risk_Analysis__c.create(payload)
        if not outcome.get('success'):
            problems = outcome.get('errors', [])
            return None, (problems[0]['message'] if problems else "Unknown error")
        return outcome.get('id'), None
    except Exception as exc:
        return None, f"Salesforce error: {str(exc)}"
 def extract_text_from_pdf(pdf_path: str) -> str:
     """Extract text from PDF using pdfplumber"""
-    text = ""
-    with pdfplumber.open(pdf_path) as pdf:
-        for page in pdf.pages:
-            text += page.extract_text() or ""
-    return text
 def count_keywords(text: str, keywords: List[str]) -> Dict[str, int]:
     """Count occurrences of keywords in text"""
@@ -278,7 +239,7 @@ def find_penalty_values(text: str) -> List[float]:
         r'\d+\s*(?:percent|%)',
         r'(?:\b[a-z]+\s*)+dollars',
     ]
     penalties = []
     for pattern in patterns:
         matches = re.finditer(pattern, text, flags=re.IGNORECASE)
@@ -298,7 +259,7 @@ def calculate_risk_score(penalty_count: int, penalty_values: List[float], obliga
     """Calculate risk score based on various factors"""
     score = 0
     score += min(penalty_count * 5, 30)
     if penalty_values:
         avg_penalty = sum(penalty_values) / len(penalty_values)
         if avg_penalty > 1000000:
@@ -309,11 +270,11 @@ def calculate_risk_score(penalty_count: int, penalty_values: List[float], obliga
             score += 15
         else:
             score += 5
     score += min(obligation_count * 2, 20)
     score += min(delay_count * 10, 30)
     score = min(score, 100)
     if score < 30:
         return score, "Low"
     elif score < 70:
@@ -321,229 +282,199 @@ def calculate_risk_score(penalty_count: int, penalty_values: List[float], obliga
     else:
         return score, "High"
def generate_combined_risk_display(risk_score: float, risk_level: str) -> Tuple[str, plt.Figure]:
    """Generate a combined display with all three risk levels in one layout.

    Args:
        risk_score: Score shown on the row of the active risk level.
        risk_level: Active level, one of "Low", "Medium" or "High".

    Returns:
        A tuple ``(html, fig)``: the HTML for the three risk rows and an empty
        figure with its axes switched off.
    """
    # Build the figure directly instead of through plt.subplots(): figures
    # created by pyplot stay in its global registry until they are closed,
    # and nothing closes this one, so each call used to leak a figure.
    fig = plt.Figure(figsize=(10, 3))
    ax = fig.subplots()
    ax.axis('off')

    risk_levels = ["Low", "Medium", "High"]
    colors = ['#28a745', '#ffc107', '#dc3545']

    html_parts = ["<div class='combined-risk-container'>"]
    for level, color in zip(risk_levels, colors):
        # Only the active level shows the score; the other rows show 0.
        score = risk_score if level == risk_level else 0
        html_parts.append(f"""
        <div class='risk-row'>
            <div class='risk-label risk-{level.lower()}'>{level} Risk</div>
            <div class='risk-score risk-{level.lower()}'>{score:.1f}%</div>
            <div class='heatmap-wrapper'>
                <img src='data:image/png;base64,{create_mini_heatmap(score, color)}' style='width:100%'>
            </div>
        </div>
        """)
    html_parts.append("</div>")
    return "\n".join(html_parts), fig
def create_mini_heatmap(score: float, color: str) -> str:
    """Create a small heatmap for one risk level.

    Args:
        score: Risk score in percent; the bar fades from white up to
            ``score / 100`` of the full colour.
        color: Colour used for the high end of the gradient.

    Returns:
        The rendered PNG as a base64-encoded string.
    """
    fig, ax = plt.subplots(figsize=(8, 0.5))
    try:
        if score > 0:
            gradient = np.linspace(0, score / 100, 256).reshape(1, -1)
        else:
            gradient = np.zeros((1, 256))
        gradient = np.vstack((gradient, gradient))
        cmap = plt.cm.colors.LinearSegmentedColormap.from_list('custom', ['white', color])
        # Pin the colour scale to 0..1. With automatic scaling the data is
        # stretched to the full colormap, so every non-zero score produced
        # the same white-to-colour bar.
        ax.imshow(gradient, aspect='auto', cmap=cmap, vmin=0, vmax=1)
        ax.set_axis_off()
        # Use the figure's own methods rather than pyplot's "current figure".
        fig.tight_layout()
        # Save to base64 string
        buf = BytesIO()
        fig.savefig(buf, format='png', bbox_inches='tight', pad_inches=0)
    finally:
        # Always release the figure, even when rendering fails.
        plt.close(fig)
    return base64.b64encode(buf.getvalue()).decode('utf-8')
def format_warning_message(count: int, items: str, item_type: str) -> str:
    """Return the HTML banner matching the number of detected clauses.

    Args:
        count: Number of detected clauses.
        items: Accepted for call compatibility; not used in the message.
        item_type: Clause category inserted into the message text.

    Returns:
        A ``success-box`` div when ``count`` is zero, a ``warning-box`` div
        for any other count below five, and a ``danger-box`` div otherwise.
    """
    if count == 0:
        return f"""<div class="success-box">✓ No {item_type} clauses detected - Good!</div>"""
    if not count < 5:
        return f"""<div class="danger-box">⚠️⚠️ {count} {item_type} clauses detected - High Risk!</div>"""
    return f"""<div class="warning-box">⚠️ {count} {item_type} clauses detected</div>"""
def create_vertical_count_display(counts: Dict[str, int], total: int, section_type: str) -> str:
    """Render one analysis section as HTML with a row per keyword.

    Args:
        counts: Mapping of keyword to number of occurrences.
        total: Overall count shown on the "Total" line.
        section_type: Section name; it is used for the CSS class
            (``<section_type>-box``) and, title-cased, for the heading.

    Returns:
        The HTML markup of the section.
    """
    rows = "".join(
        f"""
        <div class="count-item">
            <span class="count-label">{keyword.title()}:</span>
            <span class="count-value">{occurrences}</span>
        </div>
        """
        for keyword, occurrences in counts.items()
    )
    return f"""
    <div class="section-container {section_type}-box">
        <div class="section-title">{section_type.title()} Analysis</div>
        <div style="margin-bottom: 10px;">
            <span style="font-weight: bold;">Total:</span>
            <span style="margin-left: 10px;">{total}</span>
        </div>
        {rows}
    </div>
    """
 def analyze_pdf(file_obj) -> List:
     """Main analysis function for Gradio interface"""
     try:
-        # Extract text from the uploaded file
-        text = extract_text_from_pdf(file_obj.name)
-        # Define keywords to search for
         penalty_keywords = ["penalty", "fine", "forfeit", "liquidated damages", "breach"]
         obligation_keywords = ["shall", "must", "required to", "obligated to", "duty"]
         delay_keywords = ["delay", "late", "overdue", "extension", "time is of the essence"]
-        # Count keyword occurrences
         penalty_counts = count_keywords(text, penalty_keywords)
         obligation_counts = count_keywords(text, obligation_keywords)
         delay_counts = count_keywords(text, delay_keywords)
-        # Find penalty values
         penalty_values = find_penalty_values(text)
-        # Calculate total counts
         total_penalties = sum(penalty_counts.values())
         total_obligations = sum(obligation_counts.values())
         total_delays = sum(delay_counts.values())
-        # Calculate risk score
-        risk_score, risk_level = calculate_risk_score(
-            total_penalties, penalty_values, total_obligations, total_delays
-        )
-        # Generate combined risk display
-        risk_display, _ = generate_combined_risk_display(risk_score, risk_level)
-        # Prepare warning/success messages
-        penalty_warning = format_warning_message(total_penalties, "penalty", "penalty")
-        obligation_warning = format_warning_message(total_obligations, "obligation", "obligation")
-        delay_warning = format_warning_message(total_delays, "delay", "delay")
-        # Create vertical displays
-        penalty_display = create_vertical_count_display(penalty_counts, total_penalties, "penalty")
-        obligation_display = create_vertical_count_display(obligation_counts, total_obligations, "obligation")
-        delay_display = create_vertical_count_display(delay_counts, total_delays, "delay")
-        # Combine warnings with displays
-        penalty_output = f"{penalty_warning}\n{penalty_display}"
-        obligation_output = f"{obligation_warning}\n{obligation_display}"
-        delay_output = f"{delay_warning}\n{delay_display}"
-        penalty_amounts = "\n".join([f"- ${amt:,.2f}" for amt in penalty_values[:5]]) if penalty_values else "No specific penalty amounts found"
-        # Find example sentences with penalties
         penalty_sentences = []
         for sentence in re.split(r'(?<=[.!?])\s+', text):
             if any(kw.lower() in sentence.lower() for kw in penalty_keywords):
                 penalty_sentences.append(sentence.strip())
         penalty_examples = "\n\n".join([f"{i+1}. {sent}" for i, sent in enumerate(penalty_sentences[:3])]) if penalty_sentences else "No penalty clauses found"
-        # Prepare Salesforce payload
-        salesforce_data = {
             'risk_score': risk_score,
             'risk_level': risk_level,
             'penalty_examples': penalty_examples,
-            'penalty_amounts': penalty_amounts,
-            'penalty_details': f"Total Penalties: {total_penalties}\n\n" + "\n".join([f"{kw}: {count}" for kw, count in penalty_counts.items()]),
-            'obligation_details': f"Total Obligations: {total_obligations}\n\n" + "\n".join([f"{kw}: {count}" for kw, count in obligation_counts.items()]),
-            'delay_details': f"Total Delays: {total_delays}\n\n" + "\n".join([f"{kw}: {count}" for kw, count in delay_counts.items()])
         }
-        # Create Salesforce record
-        record_id, error = create_salesforce_record(salesforce_data)
-        # **Removed the Record ID display in the output**
         return [
-            risk_display,
-            penalty_output,
-            penalty_amounts,
-            obligation_output,
-            delay_output,
-            penalty_examples,
         ]
     except Exception as e:
-        error_msg = f"<div class='salesforce-error'>❌ Processing error: {str(e)}</div>"
-        return [error_msg] * 7
# Gradio interface: page header, upload column, result columns, click wiring.
with gr.Blocks(css=css, title="PDF Contract Risk Analyzer") as demo:
    gr.Markdown("""
    <header>
        <h1 style="text-align: center; margin: 0;">📄 PDF Contract Risk Analyzer</h1>
        <p style="text-align: center; margin: 10px 0 0;">Upload a contract PDF to analyze penalties, obligations, and delays</p>
    </header>
    """)

    # Row 1: upload controls on the left, overall risk on the right.
    with gr.Row():
        with gr.Column(scale=1):
            file_input = gr.File(label="Upload PDF", file_types=[".pdf"])
            submit_btn = gr.Button("Analyze PDF", variant="primary")

        with gr.Column(scale=2):
            gr.Markdown("### 🔍 Overall Risk Assessment")
            risk_display = gr.HTML(label="Risk Analysis")

    # Row 2: one column per clause category.
    with gr.Row():
        with gr.Column(scale=1):
            gr.Markdown("### 📊 Penalties Analysis")
            penalty_count = gr.HTML(label="Penalty Clauses")
            gr.Markdown("### Penalty Amounts")
            penalty_amounts = gr.Textbox(label="", lines=5)

        with gr.Column(scale=1):
            gr.Markdown("### ⚖️ Obligations Analysis")
            obligation_count = gr.HTML(label="Obligation Clauses")

        with gr.Column(scale=1):
            gr.Markdown("### ⏱️ Delays Analysis")
            delay_count = gr.HTML(label="Delay Clauses")

    # Row 3: example sentences that mention a penalty keyword.
    with gr.Row():
        gr.Markdown("### 🔎 Extracted Penalty Clauses")
        penalty_examples = gr.Textbox(label="Example Penalty Clauses", lines=5)

    # The footer markup is intentionally disabled and therefore not rendered.

    # The order of outputs must match the list returned by analyze_pdf.
    submit_btn.click(
        fn=analyze_pdf,
        inputs=file_input,
        outputs=[
            risk_display,
            penalty_count,
            penalty_amounts,
            obligation_count,
            delay_count,
            penalty_examples,
        ],
    )

 import os
 import base64
 from io import BytesIO
+import uuid
+import logging
+# Set up logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+# Custom CSS for styling with blue theme and hidden elements
 css = """
 body {
     background-image: url('https://images.unsplash.com/photo-1604147706283-d7119b5b822c?ixlib=rb-1.2.1&auto=format&fit=crop&w=1920&q=80');
     background-position: center;
     background-attachment: fixed;
     background-repeat: no-repeat;
+    min-height: 100vh;
     margin: 0;
     padding: 0;
     font-family: Arial, sans-serif;
 }
 .gradio-container {
+    background-color: rgba(240, 248, 255, 0.95) !important;
     border-radius: 10px;
     padding: 20px;
     margin: 20px;
+    max-width: 100%;
     box-shadow: 0 4px 12px rgba(0,0,0,0.15);
+    min-height: 90vh;
+    border: 1px solid #1e90ff !important;
 }
 .risk-low { color: #28a745; font-weight: bold; }
 .risk-medium { color: #ffc107; font-weight: bold; }
 .risk-high { color: #dc3545; font-weight: bold; }
+.result-box {
+    padding: 20px;
+    border-radius: 5px;
+    margin-bottom: 20px;
+    background-color: rgba(240, 248, 255, 0.9);
+    border-left: 5px solid #1e90ff !important;
 }
+.penalty-box {
+    padding: 15px;
+    border-radius: 5px;
+    margin-bottom: 15px;
     border-left: 5px solid #dc3545;
+    background-color: rgba(255, 245, 245, 0.9);
 }
+.obligation-box {
+    padding: 15px;
+    border-radius: 5px;
+    margin-bottom: 15px;
     border-left: 5px solid #ffc107;
+    background-color: rgba(255, 249, 230, 0.9);
 }
+.delay-box {
+    padding: 15px;
+    border-radius: 5px;
+    margin-bottom: 15px;
     border-left: 5px solid #17a2b8;
+    background-color: rgba(230, 249, 255, 0.9);
 }
 .combined-risk-container {
     display: flex;
     flex-direction: column;
     gap: 10px;
     margin-bottom: 20px;
 }
 .risk-row {
     display: flex;
     align-items: center;
     gap: 15px;
     padding: 10px;
     border-radius: 5px;
+    background-color: rgba(240, 248, 255, 0.8);
+    border: 1px solid #add8e6 !important;
 }
 .risk-label {
     width: 120px;
     font-weight: bold;
     font-size: 16px;
+    color: #1e4b8f !important;
 }
 .risk-score {
     width: 100px;
     font-size: 18px;
     text-align: center;
 }
 .heatmap-wrapper {
     flex-grow: 1;
 }
 .warning-box {
     padding: 15px;
     border-radius: 5px;
     margin: 10px 0;
+    background-color: rgba(255, 243, 205, 0.9);
     border-left: 5px solid #ffc107;
     font-weight: bold;
 }
 .danger-box {
     padding: 15px;
     border-radius: 5px;
     margin: 10px 0;
+    background-color: rgba(248, 215, 218, 0.9);
     border-left: 5px solid #dc3545;
     font-weight: bold;
 }
 .success-box {
     padding: 15px;
     border-radius: 5px;
     margin: 10px 0;
+    background-color: rgba(212, 237, 218, 0.9);
     border-left: 5px solid #28a745;
     font-weight: bold;
 }
 .section-title {
     font-size: 20px;
     font-weight: bold;
     margin-bottom: 15px;
+    color: #1e4b8f !important;
 }
 .count-item {
     display: flex;
     justify-content: space-between;
     padding: 10px 0;
+    border-bottom: 1px solid #add8e6 !important;
 }
 .count-label {
     font-weight: bold;
+    color: #1e4b8f !important;
 }
 .count-value {
+    color: #4169e1 !important;
 }
+button {
+    background: linear-gradient(135deg, #1e90ff, #4169e1) !important;
+    border: none !important;
+    color: white !important;
+    font-weight: bold !important;
 }
+button:hover {
+    background: linear-gradient(135deg, #4169e1, #1e90ff) !important;
 }
+.upload-area {
+    border: 2px dashed #1e90ff !important;
+    background-color: rgba(240, 248, 255, 0.7) !important;
 }
+.upload-area:hover {
+    background-color: rgba(224, 255, 255, 0.7) !important;
 }
+/* Hide elements */
+footer, .gradio-footer, .hide, [data-testid="Use via API"], [data-testid="mmsettings"] {
+    display: none !important;
+    visibility: hidden !important;
+    height: 0 !important;
+    width: 0 !important;
+    padding: 0 !important;
+    margin: 0 !important;
 }
 """
 # Salesforce credentials
+SF_USERNAME = "Kushalpavansekharm503@agentforce.com"
+SF_PASSWORD = "Kushal@123"
+SF_TOKEN = "WwUIFWBVUjeKn9VPKyWJmawY0"
def authenticate_salesforce() -> Salesforce:
    """Authenticate with Salesforce and return a Salesforce client.

    The login uses the module-level ``SF_USERNAME``, ``SF_PASSWORD`` and
    ``SF_TOKEN`` values.

    Returns:
        The authenticated ``Salesforce`` client.

    Raises:
        Exception: If the client cannot be created. The message starts with
            "Salesforce authentication failed:" and the original error is
            attached as ``__cause__``.
    """
    try:
        sf = Salesforce(
            username=SF_USERNAME,
            password=SF_PASSWORD,
            security_token=SF_TOKEN,
        )
    except Exception as e:
        # Log with traceback, then re-raise explicitly chained so the root
        # cause stays visible to whoever handles the wrapper.
        logger.exception("Failed to authenticate with Salesforce: %s", e)
        raise Exception(f"Salesforce authentication failed: {str(e)}") from e
    logger.info("Successfully authenticated with Salesforce")
    return sf
# Warning message formatting
def format_warning_message(count: int, items: str, item_type: str) -> str:
    """Build the HTML banner that summarizes how many clauses were found.

    Args:
        count: Number of detected clauses.
        items: Accepted for call compatibility; not used in the message.
        item_type: Clause category inserted into the message text.

    Returns:
        A ``success-box`` div when ``count`` is zero, a ``warning-box`` div
        for any other count below five, and a ``danger-box`` div otherwise.
    """
    if count == 0:
        css_class = "success-box"
        message = f"✓ No {item_type} clauses detected - Good!"
    elif count < 5:
        css_class = "warning-box"
        message = f"⚠️ {count} {item_type} clauses detected"
    else:
        css_class = "danger-box"
        message = f"⚠️⚠️ {count} {item_type} clauses detected - High Risk!"
    return f"""<div class="{css_class}">{message}</div>"""
def get_hugging_face_sentiment(text: str) -> float:
    """Get sentiment score using Hugging Face model.

    Only the first 512 characters of ``text`` are classified.

    Args:
        text: Text to classify.

    Returns:
        The classifier's score when the label is ``POSITIVE``, otherwise
        ``1 - score``, rounded to two decimals. ``0.5`` is returned when the
        classifier cannot be loaded or fails.
    """
    try:
        # Building the pipeline loads the model, so it is created once and
        # kept on the function object instead of being rebuilt per call.
        classifier = getattr(get_hugging_face_sentiment, "_classifier", None)
        if classifier is None:
            from transformers import pipeline
            classifier = pipeline("sentiment-analysis", model="distilbert-base-uncased-finetuned-sst-2-english")
            get_hugging_face_sentiment._classifier = classifier
        result = classifier(text[:512])[0]
        score = result['score'] if result['label'] == 'POSITIVE' else 1 - result['score']
        return round(score, 2)
    except Exception as e:
        # Best effort: sentiment is optional, so fall back to a neutral score.
        logger.error("Hugging Face sentiment analysis failed: %s. Using fallback score.", e)
        return 0.5
 def extract_text_from_pdf(pdf_path: str) -> str:
     """Extract text from PDF using pdfplumber"""
+    try:
+        text = ""
+        with pdfplumber.open(pdf_path) as pdf:
+            for page in pdf.pages:
+                page_text = page.extract_text()
+                if page_text:
+                    text += page_text
+        return text
+    except Exception as e:
+        logger.error(f"PDF text extraction failed: {str(e)}")
+        raise Exception(f"PDF text extraction failed: {str(e)}")
 def count_keywords(text: str, keywords: List[str]) -> Dict[str, int]:
     """Count occurrences of keywords in text"""
         r'\d+\s*(?:percent|%)',
         r'(?:\b[a-z]+\s*)+dollars',
     ]
     penalties = []
     for pattern in patterns:
         matches = re.finditer(pattern, text, flags=re.IGNORECASE)
     """Calculate risk score based on various factors"""
     score = 0
     score += min(penalty_count * 5, 30)
     if penalty_values:
         avg_penalty = sum(penalty_values) / len(penalty_values)
         if avg_penalty > 1000000:
             score += 15
         else:
             score += 5
     score += min(obligation_count * 2, 20)
     score += min(delay_count * 10, 30)
     score = min(score, 100)
     if score < 30:
         return score, "Low"
     elif score < 70:
     else:
         return score, "High"
def generate_heatmap(risk_level: str):
    """Generate a simple heatmap based on risk level.

    Args:
        risk_level: "Low" selects the Blues colormap and "Medium" the Oranges
            colormap; any other value selects Reds.

    Returns:
        A Matplotlib figure showing a horizontal gradient with the label
        "<risk_level> Risk" drawn over it.

    Raises:
        Exception: If the figure cannot be built. The message starts with
            "Heatmap generation failed:" and the original error is attached
            as ``__cause__``.
    """
    try:
        # Build the figure directly instead of through plt.subplots(): figures
        # created by pyplot stay in its global registry until they are closed,
        # and nothing closes the returned figure, so each call leaked one.
        fig = plt.Figure(figsize=(8, 2))
        ax = fig.subplots()

        colormaps = {"Low": plt.cm.Blues, "Medium": plt.cm.Oranges}
        cmap = colormaps.get(risk_level, plt.cm.Reds)

        gradient = np.linspace(0, 1, 256).reshape(1, -1)
        gradient = np.vstack((gradient, gradient))
        ax.imshow(gradient, aspect='auto', cmap=cmap)

        text_color = 'white' if risk_level in ["High", "Medium"] else 'black'
        ax.text(128, 0.5, f"{risk_level} Risk", color=text_color,
                ha='center', va='center', fontsize=24, fontweight='bold')
        ax.set_axis_off()
        # Lay out this figure explicitly rather than pyplot's current figure.
        fig.tight_layout()
        return fig
    except Exception as e:
        logger.exception("Heatmap generation failed: %s", e)
        raise Exception(f"Heatmap generation failed: {str(e)}") from e
def save_to_salesforce(sf: Salesforce, data: Dict):
    """Save analysis results to Salesforce Custom_Risk_Analysis__c object.

    Args:
        sf: Authenticated Salesforce client.
        data: Analysis payload; the keys ``sentiment_score``, ``risk_score``,
            ``risk_level``, ``record_id``, ``penalty_examples``,
            ``penalty_details``, ``penalty_amounts``, ``obligation_details``
            and ``delay_details`` are read.

    Returns:
        The ``id`` of the created Salesforce record.

    Raises:
        Exception: If a key is missing, the request fails, or Salesforce does
            not report success. The message starts with "Salesforce record
            creation failed:" and the original error is attached as
            ``__cause__``.
    """
    max_text_length = 131072  # every text field is cut to this many characters
    text_fields = (
        ('Penalty_Examples__c', 'penalty_examples'),
        ('Penalty_Details__c', 'penalty_details'),
        ('Penalty_Amounts__c', 'penalty_amounts'),
        ('Obligation_Details__c', 'obligation_details'),
        ('Delay_Details__c', 'delay_details'),
    )
    try:
        record = {
            'Sentiment_Score__c': data['sentiment_score'],
            'Risk_Score__c': data['risk_score'],
            'Risk_Level__c': data['risk_level'],
            'Record_Id__c': data['record_id'],
        }
        for field_name, key in text_fields:
            record[field_name] = data[key][:max_text_length]

        result = sf.Custom_Risk_Analysis__c.create(record)
        # A response can come back without an exception and still report a
        # failure; surface its first error instead of logging a success.
        if not result.get('success'):
            errors = result.get('errors') or []
            raise Exception(errors[0]['message'] if errors else "Unknown error")

        logger.info(f"Successfully created Salesforce record: {result['id']}")
        return result['id']
    except Exception as e:
        logger.error(f"Failed to save to Salesforce: {str(e)}")
        raise Exception(f"Salesforce record creation failed: {str(e)}") from e
 def analyze_pdf(file_obj) -> List:
     """Main analysis function for Gradio interface"""
     try:
+        if not file_obj:
+            raise Exception("No PDF file uploaded. Please upload a valid PDF file.")
+        try:
+            sf = authenticate_salesforce()
+        except Exception as e:
+            raise Exception(f"Salesforce authentication failed: {str(e)}")
+        try:
+            text = extract_text_from_pdf(file_obj.name)
+            if not text.strip():
+                raise Exception("No text extracted from PDF. It might be a scanned document.")
+        except Exception as e:
+            raise Exception(f"PDF text extraction failed: {str(e)}")
+        try:
+            sentiment_score = get_hugging_face_sentiment(text)
+        except Exception as e:
+            logger.warning(f"Sentiment analysis failed: {str(e)}. Using fallback score of 0.5.")
+            sentiment_score = 0.5
         penalty_keywords = ["penalty", "fine", "forfeit", "liquidated damages", "breach"]
         obligation_keywords = ["shall", "must", "required to", "obligated to", "duty"]
         delay_keywords = ["delay", "late", "overdue", "extension", "time is of the essence"]
         penalty_counts = count_keywords(text, penalty_keywords)
         obligation_counts = count_keywords(text, obligation_keywords)
         delay_counts = count_keywords(text, delay_keywords)
         penalty_values = find_penalty_values(text)
         total_penalties = sum(penalty_counts.values())
         total_obligations = sum(obligation_counts.values())
         total_delays = sum(delay_counts.values())
+        try:
+            risk_score, risk_level = calculate_risk_score(
+                total_penalties, penalty_values, total_obligations, total_delays
+            )
+        except Exception as e:
+            raise Exception(f"Risk score calculation failed: {str(e)}")
+        try:
+            heatmap = generate_heatmap(risk_level)
+        except Exception as e:
+            raise Exception(f"Heatmap generation failed: {str(e)}")
+        penalty_details = "\n".join([f"<div class='count-item'><span class='count-label'>{kw}</span><span class='count-value'>{count}</span></div>" for kw, count in penalty_counts.items()])
+        obligation_details = "\n".join([f"<div class='count-item'><span class='count-label'>{kw}</span><span class='count-value'>{count}</span></div>" for kw, count in obligation_counts.items()])
+        delay_details = "\n".join([f"<div class='count-item'><span class='count-label'>{kw}</span><span class='count-value'>{count}</span></div>" for kw, count in delay_counts.items()])
+        penalty_amounts = "\n".join([f"<div class='count-item'><span class='count-label'>Amount</span><span class='count-value'>${amt:,.2f}</span></div>" for amt in penalty_values[:5]]) if penalty_values else "<div class='count-item'><span class='count-label'>No penalty amounts found</span><span class='count-value'>0</span></div>"
         penalty_sentences = []
         for sentence in re.split(r'(?<=[.!?])\s+', text):
             if any(kw.lower() in sentence.lower() for kw in penalty_keywords):
                 penalty_sentences.append(sentence.strip())
         penalty_examples = "\n\n".join([f"{i+1}. {sent}" for i, sent in enumerate(penalty_sentences[:3])]) if penalty_sentences else "No penalty clauses found"
+        record_id = str(uuid.uuid4())
+        sf_data = {
+            'sentiment_score': sentiment_score,
             'risk_score': risk_score,
             'risk_level': risk_level,
+            'record_id': record_id,
             'penalty_examples': penalty_examples,
+            'penalty_details': "\n".join([f"{kw}: {count}" for kw, count in penalty_counts.items()]),
+            'penalty_amounts': "\n".join([f"${amt:,.2f}" for amt in penalty_values[:5]]) if penalty_values else "No specific penalty amounts found",
+            'obligation_details': "\n".join([f"{kw}: {count}" for kw, count in obligation_counts.items()]),
+            'delay_details': "\n".join([f"{kw}: {count}" for kw, count in delay_counts.items()])
         }
+        try:
+            salesforce_record_id = save_to_salesforce(sf, sf_data)
+            logger.info(f"Saved to Salesforce with ID: {salesforce_record_id}")
+        except Exception as e:
+            logger.error(f"Salesforce record creation failed: {str(e)}")
+        box_class = "success-box" if risk_level == "Low" else "warning-box" if risk_level == "Medium" else "danger-box"
         return [
+            f"<div class='risk-row'><span class='risk-label'>Risk Score</span><span class='risk-score risk-{risk_level.lower()}'>{risk_score:.1f}/100</span></div>",
+            f"<div class='risk-row'><span class='risk-label'>Risk Level</span><span class='risk-score risk-{risk_level.lower()}'>{risk_level}</span></div>",
+            heatmap,
+            f"<div class='penalty-box'><div class='section-title'>Penalty Clauses (Total: {total_penalties})</div>{penalty_details}</div>",
+            f"<div class='penalty-box'><div class='section-title'>Penalty Amounts ({len(penalty_values)} found)</div>{penalty_amounts}</div>",
+            f"<div class='obligation-box'><div class='section-title'>Obligation Clauses (Total: {total_obligations})</div>{obligation_details}</div>",
+            f"<div class='delay-box'><div class='section-title'>Delay Clauses (Total: {total_delays})</div>{delay_details}</div>",
+            f"<div class='result-box'><div class='section-title'>Example Penalty Clauses</div>{penalty_examples}</div>",
+            f"<div class='{box_class}'><div class='section-title'>Sentiment Analysis</div>Sentiment Score: {sentiment_score}</div>"
         ]
     except Exception as e:
+        logger.error(f"Analysis failed: {str(e)}")
+        error_message = f"<div class='danger-box'>Error: {str(e)}</div>"
+        return [error_message] * 9
# Gradio interface (blue theme): header, upload column, result rows, wiring.
with gr.Blocks(
    css=css,
    title="PDF Contract Risk Analyzer",
    theme=gr.themes.Default(primary_hue="blue"),
) as demo:
    gr.Markdown("""
        <div style='text-align: center;'>
            <h1 style='color: #1e4b8f;'>📄 PDF Contract Risk Analyzer</h1>
            <p style='color: #4169e1;'>Upload a contract PDF to analyze penalties, obligations, delays, and sentiment.</p>
        </div>
    """)

    # Row 1: upload controls on the left, overall risk on the right.
    with gr.Row():
        with gr.Column(scale=1):
            file_input = gr.File(
                label="Upload PDF",
                file_types=[".pdf"],
                elem_classes="upload-area",
            )
            submit_btn = gr.Button("Analyze PDF", variant="primary")

        with gr.Column(scale=3):
            gr.Markdown("<div class='section-title'>🔍 Overall Risk Assessment</div>")
            with gr.Group(elem_classes="combined-risk-container"):
                risk_score = gr.HTML(label="Risk Score")
                risk_level = gr.HTML(label="Risk Level")
                heatmap = gr.Plot(label="Risk Heatmap", elem_classes="heatmap-wrapper")

    # Row 2: one column per clause category.
    with gr.Row():
        with gr.Column():
            penalty_count = gr.HTML(label="Penalty Clauses")
            penalty_amounts = gr.HTML(label="Penalty Amounts")

        with gr.Column():
            obligation_count = gr.HTML(label="Obligation Clauses")

        with gr.Column():
            delay_count = gr.HTML(label="Delay Clauses")

    # Row 3: example sentences that mention a penalty keyword.
    with gr.Row():
        penalty_examples = gr.HTML(label="Example Penalty Clauses")

    # Row 4: sentiment result.
    with gr.Row():
        additional_results = gr.HTML(label="Sentiment Analysis")

    # The order of outputs must match the list returned by analyze_pdf.
    submit_btn.click(
        fn=analyze_pdf,
        inputs=file_input,
        outputs=[
            risk_score,
            risk_level,
            heatmap,
            penalty_count,
            penalty_amounts,
            obligation_count,
            delay_count,
            penalty_examples,
            additional_results,
        ],
    )