Spaces:

RoyAalekh
/

hackathon_code4change

Sleeping

File size: 12,907 Bytes

cecefdc
 
 
 
 
 
 
 
 
 
 
 
 
 
6a28f91
 
 
f6c65ef
 
 
 
cecefdc
 
 
 
f6c65ef
cecefdc
 
 
f6c65ef
cecefdc
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f6c65ef
 
 
 
 
 
 
cecefdc
 
 
 
 
 
 
 
 
 
 
 
f6c65ef
 
 
 
 
 
 
 
 
cecefdc
7a39bba
 
 
cecefdc
 
 
f6c65ef
cecefdc
f6c65ef
cecefdc
 
 
f6c65ef
cecefdc
 
 
f6c65ef
cecefdc
 
 
f6c65ef
cecefdc
f6c65ef
cecefdc
 
f6c65ef
cecefdc
 
 
f6c65ef
cecefdc
f6c65ef
 
cecefdc
f6c65ef
 
cecefdc
 
f6c65ef
 
cecefdc
 
f6c65ef
 
cecefdc
f6c65ef
 
 
cecefdc
f6c65ef
cecefdc
 
f6c65ef
cecefdc
 
 
7a39bba
 
 
 
cecefdc
 
f6c65ef
 
 
 
 
 
 
 
 
 
 
 
cecefdc
 
 
 
f6c65ef
 
 
 
 
cecefdc
f6c65ef
cecefdc
 
 
f6c65ef
 
 
 
cecefdc
f6c65ef
 
 
7a39bba
 
 
 
 
 
f6c65ef
cecefdc
 
 
f6c65ef
 
 
 
 
 
 
cecefdc
 
f6c65ef
cecefdc
 
 
 
f6c65ef
07fb80f
 
 
 
 
 
 
 
 
cecefdc
 
7a39bba
cecefdc
07fb80f
cecefdc
 
f6c65ef
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cecefdc
f6c65ef
 
 
cecefdc
07fb80f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cecefdc
 
f6c65ef
 
 
 
 
cecefdc
 
 
 
f6c65ef
 
 
 
 
cecefdc
f6c65ef
 
 
cecefdc
 
f6c65ef
 
cecefdc
f6c65ef
 
cecefdc
f6c65ef
 
 
 
 
 
 
 
 
cecefdc
f6c65ef
cecefdc
 
 
f6c65ef
cecefdc
 
f6c65ef
cecefdc
 
7a39bba
 
 
f6c65ef
cecefdc
 
7a39bba
 
 
 
 
f6c65ef
cecefdc
 
7a39bba
 
 
 
 
f6c65ef
cecefdc
 
 
 
 
 
7a39bba
 
 
 
 
cecefdc
 
f6c65ef
cecefdc
 
 
 
 
7a39bba

"""Ripeness Classifier page - Interactive explainability and threshold tuning.

This page provides full transparency into how cases are classified as RIPE/UNRIPE/UNKNOWN,
allows interactive threshold tuning, and provides case-level explainability.
"""

from __future__ import annotations

from datetime import date, timedelta

import pandas as pd
import plotly.express as px
import streamlit as st

from src.core.case import Case, CaseStatus
from src.core.ripeness import RipenessClassifier, RipenessStatus
from src.dashboard.utils.data_loader import (
    attach_history_to_cases,
    load_generated_cases,
    load_generated_hearings,
)

# Page configuration
st.set_page_config(
    page_title="Ripeness Classifier",
    page_icon="target",
    layout="wide",
)

st.title("Ripeness Classifier - Explainability Dashboard")
st.markdown("Understand and tune the case readiness algorithm")

# Initialize session state for thresholds
if "min_service_hearings" not in st.session_state:
    st.session_state.min_service_hearings = 2
if "min_stage_days" not in st.session_state:
    st.session_state.min_stage_days = 30
if "min_case_age_days" not in st.session_state:
    st.session_state.min_case_age_days = 90

# Sidebar: Threshold controls
st.sidebar.header("Threshold Configuration")

st.sidebar.markdown("### Adjust Ripeness Thresholds")

min_service_hearings = st.sidebar.slider(
    "Min Service Hearings",
    min_value=0,
    max_value=10,
    value=st.session_state.min_service_hearings,
    step=1,
    help="Minimum number of service hearings before a case is considered RIPE",
)

min_stage_days = st.sidebar.slider(
    "Min Stage Days",
    min_value=0,
    max_value=180,
    value=st.session_state.min_stage_days,
    step=5,
    help="Minimum days in current stage",
)

min_case_age_days = st.sidebar.slider(
    "Min Case Age (days)",
    min_value=0,
    max_value=730,
    value=st.session_state.min_case_age_days,
    step=30,
    help="Minimum case age before considered RIPE",
)

# Detailed history toggle
use_history = st.sidebar.toggle(
    "Use detailed hearing history (if available)",
    value=True,
    help="When enabled, the classifier will use per-hearing history from hearings.csv if present.",
)

# Reset button
if st.sidebar.button("Reset to Defaults"):
    st.session_state.min_service_hearings = 2
    st.session_state.min_stage_days = 30
    st.session_state.min_case_age_days = 90
    st.rerun()

# Update session state
st.session_state.min_service_hearings = min_service_hearings
st.session_state.min_stage_days = min_stage_days
st.session_state.min_case_age_days = min_case_age_days

# Wire sidebar thresholds to the core classifier
RipenessClassifier.set_thresholds(
    {
        "MIN_SERVICE_HEARINGS": min_service_hearings,
        "MIN_STAGE_DAYS": min_stage_days,
        "MIN_CASE_AGE_DAYS": min_case_age_days,
    }
)

# Main content
tab1, tab2, tab3 = st.tabs(
    ["Current Configuration", "Interactive Testing", "Batch Classification"]
)

with tab1:
    st.markdown("### Current Classifier Configuration")

    col1, col2, col3 = st.columns(3)

    with col1:
        st.metric("Min Service Hearings", min_service_hearings)
        st.caption("Cases need at least this many service hearings")

    with col2:
        st.metric("Min Stage Days", min_stage_days)
        st.caption("Days in current stage threshold")

    with col3:
        st.metric("Min Case Age", f"{min_case_age_days} days")
        st.caption("Minimum case age requirement")

    st.markdown("---")

    # Classification logic flowchart
    st.markdown("### Classification Logic")

    with st.expander("View Decision Tree Logic"):
        st.markdown("""
        The ripeness classifier uses the following decision logic:

        **1. Service Hearings Check**
        - If `service_hearings < MIN_SERVICE_HEARINGS` -> **UNRIPE**

        **2. Case Age Check**
        - If `case_age < MIN_CASE_AGE_DAYS` -> **UNRIPE**

        **3. Stage-Specific Checks**
        - Each stage has minimum days requirement
        - If `days_in_stage < stage_requirement` -> **UNRIPE**

        **4. Keyword Analysis**
        - Certain keywords indicate ripeness (e.g., "reply filed", "arguments complete")
        - If keywords found -> **RIPE**

        **5. Final Classification**
        - If all criteria met -> **RIPE**
        - If some criteria failed but not critical -> **UNKNOWN**
        - Otherwise -> **UNRIPE**
        """)

    # Show stage-specific rules
    st.markdown("### Stage-Specific Rules")

    stage_rules = {
        "PRE-TRIAL": {"min_days": 60, "keywords": ["affidavit filed", "reply filed"]},
        "TRIAL": {"min_days": 45, "keywords": ["evidence complete", "cross complete"]},
        "POST-TRIAL": {
            "min_days": 30,
            "keywords": ["arguments complete", "written note"],
        },
        "FINAL DISPOSAL": {"min_days": 15, "keywords": ["disposed", "judgment"]},
    }

    df_rules = pd.DataFrame(
        [
            {
                "Stage": stage,
                "Min Days": rules["min_days"],
                "Keywords": ", ".join(rules["keywords"]),
            }
            for stage, rules in stage_rules.items()
        ]
    )

    st.dataframe(df_rules, use_container_width=True, hide_index=True)

with tab2:
    st.markdown("### Interactive Case Classification Testing")

    st.markdown(
        "Create a synthetic case and see how it would be classified with current thresholds"
    )

    col1, col2 = st.columns(2)

    with col1:
        case_id = st.text_input("Case ID", value="TEST-001")
        case_type = st.selectbox("Case Type", ["CIVIL", "CRIMINAL", "WRIT", "PIL"])
        case_stage = st.selectbox(
            "Current Stage", ["PRE-TRIAL", "TRIAL", "POST-TRIAL", "FINAL DISPOSAL"]
        )

    with col2:
        service_hearings_count = st.number_input(
            "Service Hearings", min_value=0, max_value=20, value=3
        )
        days_in_stage = st.number_input(
            "Days in Stage", min_value=0, max_value=365, value=45
        )
        case_age = st.number_input(
            "Case Age (days)", min_value=0, max_value=3650, value=120
        )

    # Keywords
    has_keywords = st.multiselect(
        "Keywords Found",
        options=[
            "reply filed",
            "affidavit filed",
            "arguments complete",
            "evidence complete",
            "written note",
        ],
        default=[],
    )

    if st.button("Classify Case"):
        # Create synthetic case
        today = date.today()
        filed_date = today - timedelta(days=case_age)

        # Map UI-friendly stage labels to classifier's internal stage names
        stage_map = {
            "PRE-TRIAL": "ADMISSION",  # early-stage administrative
            "TRIAL": "EVIDENCE",  # substantive stage
            "POST-TRIAL": "ORDERS / JUDGMENT",  # arguments/orders phase
            "FINAL DISPOSAL": "FINAL DISPOSAL",
        }
        classifier_stage = stage_map.get(case_stage, case_stage)

        test_case = Case(
            case_id=case_id,
            case_type=case_type,
            filed_date=filed_date,
            current_stage=classifier_stage,
            status=CaseStatus.PENDING,
        )

        # Populate aggregates and optional purpose based on selected keywords
        test_case.hearing_count = service_hearings_count
        test_case.days_in_stage = int(days_in_stage)
        test_case.age_days = int(case_age)
        test_case.last_hearing_purpose = has_keywords[0] if has_keywords else None

        # Use the real classifier
        status = RipenessClassifier.classify(test_case)
        reason = RipenessClassifier.get_ripeness_reason(status)

        color = (
            "green"
            if status == RipenessStatus.RIPE
            else ("red" if status.is_unripe() else "orange")
        )
        st.markdown("### Classification Result")
        st.markdown(f":{color}[**{status.value}**]")
        st.caption(reason)

        # Debug details to explain classification
        with st.expander("Why this classification? (debug)"):
            thresholds = RipenessClassifier.get_current_thresholds()
            service_ok = service_hearings_count >= thresholds[
                "MIN_SERVICE_HEARINGS"
            ] or bool(test_case.last_hearing_purpose)
            compliance_ok = (
                classifier_stage not in RipenessClassifier.UNRIPE_STAGES
                or days_in_stage >= thresholds["MIN_STAGE_DAYS"]
            )
            age_ok = case_age >= thresholds["MIN_CASE_AGE_DAYS"]

            st.write(
                {
                    "ui_stage": case_stage,
                    "classifier_stage": classifier_stage,
                    "hearing_count": service_hearings_count,
                    "days_in_stage": int(days_in_stage),
                    "age_days": int(case_age),
                    "last_hearing_purpose": test_case.last_hearing_purpose,
                    "evidence": {
                        "service_ok": service_ok,
                        "compliance_ok": compliance_ok,
                        "age_ok": age_ok,
                        "all_ok": service_ok and compliance_ok and age_ok,
                    },
                    "thresholds": thresholds,
                }
            )

with tab3:
    st.markdown("### Batch Classification Analysis")

    st.markdown(
        "Load generated test cases and classify them with current thresholds (core classifier)"
    )

    if st.button("Load & Classify Test Cases"):
        with st.spinner("Loading cases..."):
            try:
                cases = load_generated_cases()

                if use_history:
                    hearings_df = load_generated_hearings()
                    cases = attach_history_to_cases(cases, hearings_df)

                if not cases:
                    st.warning(
                        "No test cases found. Generate cases first: `uv run court-scheduler generate`"
                    )
                else:
                    st.success(f"Loaded {len(cases)} test cases")

                    # Classify all cases using the core classifier
                    classifications = {"RIPE": 0, "UNRIPE": 0, "UNKNOWN": 0}

                    today = date.today()
                    for case in cases:
                        # Ensure aggregates are available
                        case.age_days = (today - case.filed_date).days
                        if getattr(case, "stage_start_date", None):
                            case.days_in_stage = (today - case.stage_start_date).days
                        else:
                            case.days_in_stage = case.age_days

                        status = RipenessClassifier.classify(case)
                        if status == RipenessStatus.RIPE:
                            classifications["RIPE"] += 1
                        elif status == RipenessStatus.UNKNOWN:
                            classifications["UNKNOWN"] += 1
                        else:
                            classifications["UNRIPE"] += 1

                    # Display results
                    col1, col2, col3 = st.columns(3)

                    with col1:
                        pct = classifications["RIPE"] / len(cases) * 100
                        st.metric(
                            "RIPE Cases", f"{classifications['RIPE']:,}", f"{pct:.1f}%"
                        )

                    with col2:
                        pct = classifications["UNKNOWN"] / len(cases) * 100
                        st.metric(
                            "UNKNOWN Cases",
                            f"{classifications['UNKNOWN']:,}",
                            f"{pct:.1f}%",
                        )

                    with col3:
                        pct = classifications["UNRIPE"] / len(cases) * 100
                        st.metric(
                            "UNRIPE Cases",
                            f"{classifications['UNRIPE']:,}",
                            f"{pct:.1f}%",
                        )

                    # Pie chart
                    fig = px.pie(
                        values=list(classifications.values()),
                        names=list(classifications.keys()),
                        title="Classification Distribution",
                        color=list(classifications.keys()),
                        color_discrete_map={
                            "RIPE": "green",
                            "UNKNOWN": "orange",
                            "UNRIPE": "red",
                        },
                    )
                    st.plotly_chart(fig, use_container_width=True)

            except Exception as e:
                st.error(f"Error loading cases: {e}")

# Footer
st.markdown("---")
st.markdown(
    "*Adjust thresholds in the sidebar to see real-time impact on classification*"
)