RoyAalekh committed on
Commit
7a39bba
·
1 Parent(s): b5f21c3

Fixed app.py and data insights page

Browse files
scheduler/dashboard/app.py CHANGED
@@ -1,13 +1,11 @@
1
  """Main dashboard application for Court Scheduling System.
2
 
3
  This is the entry point for the Streamlit multi-page dashboard.
4
- Launch with: uv run court-scheduler dashboard
5
  """
6
 
7
  from __future__ import annotations
8
 
9
- import subprocess
10
- from pathlib import Path
11
 
12
  import streamlit as st
13
 
@@ -21,29 +19,17 @@ st.set_page_config(
21
  initial_sidebar_state="expanded",
22
  )
23
 
24
- # Enforce `uv` availability for all dashboard-triggered commands
25
- try:
26
- uv_check = subprocess.run(["uv", "--version"], capture_output=True, text=True)
27
- if uv_check.returncode != 0:
28
- raise RuntimeError(uv_check.stderr or "uv not available")
29
- except Exception:
30
- import streamlit as st
31
-
32
- st.error(
33
- "'uv' is required to run this dashboard's commands. Please install uv and rerun.\n\n"
34
- "Install on macOS/Linux: `curl -LsSf https://astral.sh/uv/install.sh | sh`\n"
35
- "Install on Windows (PowerShell): `irm https://astral.sh/uv/install.ps1 | iex`"
36
- )
37
- st.stop()
38
-
39
  # Main page content
40
  st.title("Court Scheduling System Dashboard")
41
- st.markdown("**Karnataka High Court - Algorithmic Decision Support for Fair Scheduling**")
 
 
42
 
43
  st.markdown("---")
44
 
45
  # Introduction
46
- st.markdown("""
 
47
  ### Overview
48
 
49
  This system provides data-driven scheduling recommendations while maintaining judicial control and autonomy.
@@ -57,7 +43,8 @@ This system provides data-driven scheduling recommendations while maintaining ju
57
  - Reinforcement learning optimization
58
 
59
  Use the sidebar to navigate between sections.
60
- """)
 
61
 
62
  # System status
63
  status_header_col1, status_header_col2 = st.columns([3, 1])
@@ -93,47 +80,57 @@ with col3:
93
  st.caption("Run EDA pipeline to generate visualizations")
94
 
95
  # Setup Controls
96
- eda_ready = data_status["cleaned_data"] and data_status["parameters"] and data_status["eda_figures"]
 
 
 
 
97
 
98
  if not eda_ready:
99
  st.markdown("---")
100
  st.markdown("### Initial Setup")
101
- st.warning("Run the EDA pipeline to process historical data and extract parameters.")
 
 
102
 
103
  col1, col2 = st.columns([2, 1])
104
 
105
  with col1:
106
- st.markdown("""
 
107
  The EDA pipeline:
108
  - Loads and cleans historical court case data
109
  - Extracts statistical parameters (distributions, transition probabilities)
110
  - Generates analysis visualizations
111
 
112
  This is required before using other dashboard features.
113
- """)
 
114
 
115
  with col2:
116
  if st.button("Run EDA Pipeline", type="primary", use_container_width=True):
117
- import subprocess
 
 
118
 
119
  with st.spinner("Running EDA pipeline... This may take a few minutes."):
120
  try:
121
- result = subprocess.run(
122
- ["uv", "run", "court-scheduler", "eda"],
123
- capture_output=True,
124
- text=True,
125
- cwd=str(Path.cwd()),
126
- )
127
-
128
- if result.returncode == 0:
129
- st.success("EDA pipeline completed")
130
- st.rerun()
131
- else:
132
- st.error(f"Pipeline failed with error code {result.returncode}")
133
- with st.expander("Show error details"):
134
- st.code(result.stderr, language="text")
135
  except Exception as e:
136
- st.error(f"Error running pipeline: {e}")
 
 
137
 
138
  with st.expander("Run manually via CLI"):
139
  st.code("uv run court-scheduler eda", language="bash")
@@ -148,7 +145,8 @@ st.markdown("### Dashboard Sections")
148
  col1, col2 = st.columns(2)
149
 
150
  with col1:
151
- st.markdown("""
 
152
  #### 1. Data & Insights
153
  Explore historical case data, view analysis visualizations, and review extracted parameters.
154
 
@@ -157,10 +155,12 @@ with col1:
157
 
158
  #### 3. Simulation Workflow
159
  Generate cases, configure simulation parameters, run scheduling simulations, and view results.
160
- """)
 
161
 
162
  with col2:
163
- st.markdown("""
 
164
  #### 4. Cause Lists & Overrides
165
  View generated cause lists, make judge overrides, and track modification history.
166
 
@@ -169,13 +169,15 @@ with col2:
169
 
170
  #### 6. Analytics & Reports
171
  Compare simulation runs, analyze performance metrics, and export comprehensive reports.
172
- """)
 
173
 
174
  st.markdown("---")
175
 
176
  # Typical Workflow
177
  with st.expander("Typical Usage Workflow"):
178
- st.markdown("""
 
179
  **Step 1: Initial Setup**
180
  - Run EDA pipeline to process historical data (one-time setup)
181
 
@@ -202,7 +204,8 @@ with st.expander("Typical Usage Workflow"):
202
  - Use Analytics & Reports to evaluate fairness and efficiency
203
  - Compare different scheduling policies
204
  - Identify bottlenecks and improvement opportunities
205
- """)
 
206
 
207
  # Footer
208
  st.markdown("---")
 
1
  """Main dashboard application for Court Scheduling System.
2
 
3
  This is the entry point for the Streamlit multi-page dashboard.
4
+ Launch with: uv run court-scheduler dashboard (or `streamlit run` directly)
5
  """
6
 
7
  from __future__ import annotations
8
 
 
 
9
 
10
  import streamlit as st
11
 
 
19
  initial_sidebar_state="expanded",
20
  )
21
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  # Main page content
23
  st.title("Court Scheduling System Dashboard")
24
+ st.markdown(
25
+ "**Karnataka High Court - Algorithmic Decision Support for Fair Scheduling**"
26
+ )
27
 
28
  st.markdown("---")
29
 
30
  # Introduction
31
+ st.markdown(
32
+ """
33
  ### Overview
34
 
35
  This system provides data-driven scheduling recommendations while maintaining judicial control and autonomy.
 
43
  - Reinforcement learning optimization
44
 
45
  Use the sidebar to navigate between sections.
46
+ """
47
+ )
48
 
49
  # System status
50
  status_header_col1, status_header_col2 = st.columns([3, 1])
 
80
  st.caption("Run EDA pipeline to generate visualizations")
81
 
82
  # Setup Controls
83
+ eda_ready = (
84
+ data_status["cleaned_data"]
85
+ and data_status["parameters"]
86
+ and data_status["eda_figures"]
87
+ )
88
 
89
  if not eda_ready:
90
  st.markdown("---")
91
  st.markdown("### Initial Setup")
92
+ st.warning(
93
+ "Run the EDA pipeline to process historical data and extract parameters."
94
+ )
95
 
96
  col1, col2 = st.columns([2, 1])
97
 
98
  with col1:
99
+ st.markdown(
100
+ """
101
  The EDA pipeline:
102
  - Loads and cleans historical court case data
103
  - Extracts statistical parameters (distributions, transition probabilities)
104
  - Generates analysis visualizations
105
 
106
  This is required before using other dashboard features.
107
+ """
108
+ )
109
 
110
  with col2:
111
  if st.button("Run EDA Pipeline", type="primary", use_container_width=True):
112
+ from eda.load_clean import run_load_and_clean
113
+ from eda.exploration import run_exploration
114
+ from eda.parameters import run_parameter_export
115
 
116
  with st.spinner("Running EDA pipeline... This may take a few minutes."):
117
  try:
118
+ # Step 1: Load & clean data
119
+ run_load_and_clean()
120
+
121
+ # Step 2: Generate visualizations
122
+ run_exploration()
123
+
124
+ # Step 3: Extract parameters
125
+ run_parameter_export()
126
+
127
+ st.success("EDA pipeline completed")
128
+ st.rerun()
129
+
 
 
130
  except Exception as e:
131
+ st.error("Pipeline failed while running inside the dashboard.")
132
+ with st.expander("Show error details"):
133
+ st.exception(e)
134
 
135
  with st.expander("Run manually via CLI"):
136
  st.code("uv run court-scheduler eda", language="bash")
 
145
  col1, col2 = st.columns(2)
146
 
147
  with col1:
148
+ st.markdown(
149
+ """
150
  #### 1. Data & Insights
151
  Explore historical case data, view analysis visualizations, and review extracted parameters.
152
 
 
155
 
156
  #### 3. Simulation Workflow
157
  Generate cases, configure simulation parameters, run scheduling simulations, and view results.
158
+ """
159
+ )
160
 
161
  with col2:
162
+ st.markdown(
163
+ """
164
  #### 4. Cause Lists & Overrides
165
  View generated cause lists, make judge overrides, and track modification history.
166
 
 
169
 
170
  #### 6. Analytics & Reports
171
  Compare simulation runs, analyze performance metrics, and export comprehensive reports.
172
+ """
173
+ )
174
 
175
  st.markdown("---")
176
 
177
  # Typical Workflow
178
  with st.expander("Typical Usage Workflow"):
179
+ st.markdown(
180
+ """
181
  **Step 1: Initial Setup**
182
  - Run EDA pipeline to process historical data (one-time setup)
183
 
 
204
  - Use Analytics & Reports to evaluate fairness and efficiency
205
  - Compare different scheduling policies
206
  - Identify bottlenecks and improvement opportunities
207
+ """
208
+ )
209
 
210
  # Footer
211
  st.markdown("---")
scheduler/dashboard/pages/1_Data_And_Insights.py CHANGED
@@ -70,7 +70,9 @@ def load_dashboard_data():
70
 
71
  with st.spinner("Loading data..."):
72
  try:
73
- cases_df, hearings_df, params, stats, total_cases, total_hearings = load_dashboard_data()
 
 
74
  except Exception as e:
75
  st.error(f"Error loading data: {e}")
76
  st.info("Please run the EDA pipeline first: `uv run court-scheduler eda`")
@@ -96,28 +98,25 @@ if cases_df.empty and hearings_df.empty:
96
 
97
  with col1:
98
  if st.button("Run EDA Pipeline Now", type="primary", use_container_width=True):
99
- import subprocess
 
 
100
 
101
  with st.spinner("Running EDA pipeline... This will take a few minutes."):
102
  try:
103
- result = subprocess.run(
104
- ["uv", "run", "court-scheduler", "eda"],
105
- capture_output=True,
106
- text=True,
107
- cwd=str(Path.cwd()),
108
- )
109
-
110
- if result.returncode == 0:
111
- st.success("EDA pipeline completed successfully!")
112
- st.info("Reload this page to see the data.")
113
- if st.button("Reload Page"):
114
- st.rerun()
115
- else:
116
- st.error(f"Pipeline failed with error code {result.returncode}")
117
- with st.expander("Error details"):
118
- st.code(result.stderr, language="text")
119
  except Exception as e:
120
- st.error(f"Error: {e}")
 
121
 
122
  with col2:
123
  with st.expander("Alternative: Run via CLI"):
@@ -133,7 +132,9 @@ col1, col2, col3, col4, col5 = st.columns(5)
133
  with col1:
134
  st.metric("Total Cases", f"{total_cases:,}")
135
  if "YEAR_FILED" in cases_df.columns:
136
- year_range = f"{cases_df['YEAR_FILED'].min():.0f}-{cases_df['YEAR_FILED'].max():.0f}"
 
 
137
  st.caption(f"Years: {year_range}")
138
 
139
  with col2:
@@ -176,7 +177,9 @@ with col5:
176
  st.markdown("---")
177
 
178
  # Main tabs
179
- tab1, tab2, tab3 = st.tabs(["Historical Analysis", "Interactive Exploration", "Parameters"])
 
 
180
 
181
  # TAB 1: Historical Analysis - Pre-generated figures
182
  with tab1:
@@ -188,11 +191,15 @@ with tab1:
188
  figures_dir = Path("reports/figures")
189
 
190
  if not figures_dir.exists():
191
- st.warning("EDA figures not found. Run the EDA pipeline to generate visualizations.")
 
 
192
  st.code("uv run court-scheduler eda")
193
  else:
194
  # Find latest versioned directory
195
- version_dirs = [d for d in figures_dir.iterdir() if d.is_dir() and d.name.startswith("v")]
 
 
196
 
197
  if not version_dirs:
198
  st.warning(
@@ -207,7 +214,9 @@ with tab1:
207
  # List available figures from the versioned directory
208
  # Exclude deprecated/removed visuals like the monthly waterfall
209
  figure_files = [
210
- f for f in sorted(latest_dir.glob("*.html")) if "waterfall" not in f.name.lower()
 
 
211
  ]
212
 
213
  if not figure_files:
@@ -227,10 +236,14 @@ with tab1:
227
  if any(x in f.name for x in ["stage", "sankey", "transition"])
228
  ]
229
  time_figs = [
230
- f for f in figure_files if any(x in f.name for x in ["monthly", "load", "gap"])
 
 
231
  ]
232
  other_figs = [
233
- f for f in figure_files if f not in distribution_figs + stage_figs + time_figs
 
 
234
  ]
235
 
236
  # Category 1: Case Distributions
@@ -325,7 +338,9 @@ with tab2:
325
  selected_stages = st.sidebar.multiselect(
326
  "Stages",
327
  options=available_stages,
328
- default=available_stages[:10] if len(available_stages) > 10 else available_stages,
 
 
329
  key="stage_filter",
330
  )
331
  else:
@@ -334,12 +349,16 @@ with tab2:
334
 
335
  # Apply filters with copy to ensure clean dataframes
336
  if selected_case_types and case_type_col:
337
- filtered_cases = cases_df[cases_df[case_type_col].isin(selected_case_types)].copy()
 
 
338
  else:
339
  filtered_cases = cases_df.copy()
340
 
341
  if selected_stages and stage_col:
342
- filtered_hearings = hearings_df[hearings_df[stage_col].isin(selected_stages)].copy()
 
 
343
  else:
344
  filtered_hearings = hearings_df.copy()
345
 
@@ -370,9 +389,9 @@ with tab2:
370
 
371
  with col4:
372
  if "Outcome" in filtered_hearings.columns and len(filtered_hearings) > 0:
373
- adj_rate_filtered = (filtered_hearings["Outcome"] == "ADJOURNED").sum() / len(
374
- filtered_hearings
375
- )
376
  st.metric("Adjournment Rate", f"{adj_rate_filtered:.1%}")
377
  else:
378
  st.metric("Adjournment Rate", "N/A")
@@ -387,9 +406,15 @@ with tab2:
387
  with sub_tab1:
388
  st.markdown("#### Case Distribution by Type")
389
 
390
- if case_type_col and case_type_col in filtered_cases.columns and len(filtered_cases) > 0:
 
 
 
 
391
  # Compute value counts and ensure proper structure
392
- case_type_counts = filtered_cases[case_type_col].value_counts().reset_index()
 
 
393
  # Rename columns for clarity (works across pandas versions)
394
  case_type_counts.columns = ["CaseType", "Count"]
395
 
@@ -428,7 +453,11 @@ with tab2:
428
  with sub_tab2:
429
  st.markdown("#### Stage Analysis")
430
 
431
- if stage_col and stage_col in filtered_hearings.columns and len(filtered_hearings) > 0:
 
 
 
 
432
  stage_counts = filtered_hearings[stage_col].value_counts().reset_index()
433
  stage_counts.columns = ["Stage", "Count"]
434
 
@@ -465,7 +494,10 @@ with tab2:
465
  not_adjourned = total_hearings - adjourned
466
 
467
  outcome_df = pd.DataFrame(
468
- {"Outcome": ["ADJOURNED", "NOT ADJOURNED"], "Count": [adjourned, not_adjourned]}
 
 
 
469
  )
470
 
471
  fig_pie = px.pie(
@@ -474,7 +506,10 @@ with tab2:
474
  names="Outcome",
475
  title=f"Outcome Distribution (Total: {total_hearings:,})",
476
  color="Outcome",
477
- color_discrete_map={"ADJOURNED": "#ef4444", "NOT ADJOURNED": "#22c55e"},
 
 
 
478
  )
479
  fig_pie.update_layout(height=400)
480
  st.plotly_chart(fig_pie, use_container_width=True)
@@ -483,7 +518,9 @@ with tab2:
483
  st.markdown("**By Stage**")
484
  adj_by_stage = (
485
  filtered_hearings.groupby(stage_col)["Outcome"]
486
- .apply(lambda x: (x == "ADJOURNED").sum() / len(x) if len(x) > 0 else 0)
 
 
487
  .reset_index()
488
  )
489
  adj_by_stage.columns = ["Stage", "Rate"]
@@ -507,7 +544,9 @@ with tab2:
507
  with sub_tab4:
508
  st.markdown("#### Raw Data")
509
 
510
- data_view = st.radio("Select data to view:", ["Cases", "Hearings"], horizontal=True)
 
 
511
 
512
  if data_view == "Cases":
513
  st.dataframe(
@@ -516,7 +555,9 @@ with tab2:
516
  height=600,
517
  )
518
 
519
- st.markdown(f"**Showing first 500 of {len(filtered_cases):,} filtered cases**")
 
 
520
 
521
  # Download button
522
  csv = filtered_cases.to_csv(index=False).encode("utf-8")
@@ -533,7 +574,9 @@ with tab2:
533
  height=600,
534
  )
535
 
536
- st.markdown(f"**Showing first 500 of {len(filtered_hearings):,} filtered hearings**")
 
 
537
 
538
  # Download button
539
  csv = filtered_hearings.to_csv(index=False).encode("utf-8")
@@ -559,7 +602,10 @@ with tab3:
559
  st.markdown("#### Case Types")
560
  if "case_types" in params and params["case_types"]:
561
  case_types_df = pd.DataFrame(
562
- {"Case Type": params["case_types"], "Index": range(len(params["case_types"]))}
 
 
 
563
  )
564
  st.dataframe(case_types_df, use_container_width=True, hide_index=True)
565
  st.caption(f"Total: {len(params['case_types'])} case types")
@@ -594,9 +640,13 @@ with tab3:
594
  with st.expander(f"From: {stage}"):
595
  trans_df = pd.DataFrame(transitions)
596
  if not trans_df.empty:
597
- st.dataframe(trans_df, use_container_width=True, hide_index=True)
 
 
598
 
599
- st.caption(f"Total: {len(params['stage_graph'])} stages with transition data")
 
 
600
  else:
601
  st.info("No stage transition data found")
602
 
@@ -609,8 +659,12 @@ with tab3:
609
 
610
  # Create heatmap
611
  adj_stats = params["adjournment_stats"]
612
- stages_list = list(adj_stats.keys())[:20] # Limit to 20 stages for readability
613
- case_types_list = params.get("case_types", [])[:15] # Limit to 15 case types
 
 
 
 
614
 
615
  if stages_list and case_types_list:
616
  heatmap_data = []
@@ -656,7 +710,12 @@ with tab3:
656
  """)
657
 
658
  config_tab1, config_tab2, config_tab3, config_tab4 = st.tabs(
659
- ["EDA Parameters", "Ripeness Classifier", "Case Generator", "Simulation Defaults"]
 
 
 
 
 
660
  )
661
 
662
  with config_tab1:
@@ -857,7 +916,10 @@ UNRIPE cases: 0.7x priority
857
  from scheduler.data.config import MONTHLY_SEASONALITY
858
 
859
  season_df = pd.DataFrame(
860
- [{"Month": i, "Factor": MONTHLY_SEASONALITY.get(i, 1.0)} for i in range(1, 13)]
 
 
 
861
  )
862
  st.dataframe(season_df, use_container_width=True, hide_index=True)
863
  st.caption("1.0 = average, >1.0 = more cases, <1.0 = fewer cases")
@@ -900,7 +962,9 @@ Ripe purposes (80% probability):
900
  """,
901
  language="text",
902
  )
903
- st.caption("Early ADMISSION: 40% bottleneck, Advanced stages: mostly ripe")
 
 
904
 
905
  with config_tab4:
906
  st.markdown("#### Simulation Defaults")
@@ -930,8 +994,12 @@ Formula:
930
  st.markdown("**Courtroom Capacity**")
931
  if params and "court_capacity_global" in params:
932
  cap = params["court_capacity_global"]
933
- st.metric("Median slots/day", f"{cap.get('slots_median_global', 151):.0f}")
934
- st.metric("P90 slots/day", f"{cap.get('slots_p90_global', 200):.0f}")
 
 
 
 
935
  else:
936
  st.info("Run EDA to load capacity statistics")
937
 
 
70
 
71
  with st.spinner("Loading data..."):
72
  try:
73
+ cases_df, hearings_df, params, stats, total_cases, total_hearings = (
74
+ load_dashboard_data()
75
+ )
76
  except Exception as e:
77
  st.error(f"Error loading data: {e}")
78
  st.info("Please run the EDA pipeline first: `uv run court-scheduler eda`")
 
98
 
99
  with col1:
100
  if st.button("Run EDA Pipeline Now", type="primary", use_container_width=True):
101
+ from eda.load_clean import run_load_and_clean
102
+ from eda.exploration import run_exploration
103
+ from eda.parameters import run_parameter_export
104
 
105
  with st.spinner("Running EDA pipeline... This will take a few minutes."):
106
  try:
107
+ # Step 1: Load & clean data
108
+ run_load_and_clean()
109
+ # Step 2: Generate visualizations
110
+ run_exploration()
111
+ # Step 3: Extract parameters
112
+ run_parameter_export()
113
+ st.success("EDA pipeline completed successfully!")
114
+ st.info("Reload this page to see the updated data.")
115
+ if st.button("Reload Page"):
116
+ st.rerun()
 
 
 
 
 
 
117
  except Exception as e:
118
+ with st.expander("Error details"):
119
+ st.exception(e)
120
 
121
  with col2:
122
  with st.expander("Alternative: Run via CLI"):
 
132
  with col1:
133
  st.metric("Total Cases", f"{total_cases:,}")
134
  if "YEAR_FILED" in cases_df.columns:
135
+ year_range = (
136
+ f"{cases_df['YEAR_FILED'].min():.0f}-{cases_df['YEAR_FILED'].max():.0f}"
137
+ )
138
  st.caption(f"Years: {year_range}")
139
 
140
  with col2:
 
177
  st.markdown("---")
178
 
179
  # Main tabs
180
+ tab1, tab2, tab3 = st.tabs(
181
+ ["Historical Analysis", "Interactive Exploration", "Parameters"]
182
+ )
183
 
184
  # TAB 1: Historical Analysis - Pre-generated figures
185
  with tab1:
 
191
  figures_dir = Path("reports/figures")
192
 
193
  if not figures_dir.exists():
194
+ st.warning(
195
+ "EDA figures not found. Run the EDA pipeline to generate visualizations."
196
+ )
197
  st.code("uv run court-scheduler eda")
198
  else:
199
  # Find latest versioned directory
200
+ version_dirs = [
201
+ d for d in figures_dir.iterdir() if d.is_dir() and d.name.startswith("v")
202
+ ]
203
 
204
  if not version_dirs:
205
  st.warning(
 
214
  # List available figures from the versioned directory
215
  # Exclude deprecated/removed visuals like the monthly waterfall
216
  figure_files = [
217
+ f
218
+ for f in sorted(latest_dir.glob("*.html"))
219
+ if "waterfall" not in f.name.lower()
220
  ]
221
 
222
  if not figure_files:
 
236
  if any(x in f.name for x in ["stage", "sankey", "transition"])
237
  ]
238
  time_figs = [
239
+ f
240
+ for f in figure_files
241
+ if any(x in f.name for x in ["monthly", "load", "gap"])
242
  ]
243
  other_figs = [
244
+ f
245
+ for f in figure_files
246
+ if f not in distribution_figs + stage_figs + time_figs
247
  ]
248
 
249
  # Category 1: Case Distributions
 
338
  selected_stages = st.sidebar.multiselect(
339
  "Stages",
340
  options=available_stages,
341
+ default=available_stages[:10]
342
+ if len(available_stages) > 10
343
+ else available_stages,
344
  key="stage_filter",
345
  )
346
  else:
 
349
 
350
  # Apply filters with copy to ensure clean dataframes
351
  if selected_case_types and case_type_col:
352
+ filtered_cases = cases_df[
353
+ cases_df[case_type_col].isin(selected_case_types)
354
+ ].copy()
355
  else:
356
  filtered_cases = cases_df.copy()
357
 
358
  if selected_stages and stage_col:
359
+ filtered_hearings = hearings_df[
360
+ hearings_df[stage_col].isin(selected_stages)
361
+ ].copy()
362
  else:
363
  filtered_hearings = hearings_df.copy()
364
 
 
389
 
390
  with col4:
391
  if "Outcome" in filtered_hearings.columns and len(filtered_hearings) > 0:
392
+ adj_rate_filtered = (
393
+ filtered_hearings["Outcome"] == "ADJOURNED"
394
+ ).sum() / len(filtered_hearings)
395
  st.metric("Adjournment Rate", f"{adj_rate_filtered:.1%}")
396
  else:
397
  st.metric("Adjournment Rate", "N/A")
 
406
  with sub_tab1:
407
  st.markdown("#### Case Distribution by Type")
408
 
409
+ if (
410
+ case_type_col
411
+ and case_type_col in filtered_cases.columns
412
+ and len(filtered_cases) > 0
413
+ ):
414
  # Compute value counts and ensure proper structure
415
+ case_type_counts = (
416
+ filtered_cases[case_type_col].value_counts().reset_index()
417
+ )
418
  # Rename columns for clarity (works across pandas versions)
419
  case_type_counts.columns = ["CaseType", "Count"]
420
 
 
453
  with sub_tab2:
454
  st.markdown("#### Stage Analysis")
455
 
456
+ if (
457
+ stage_col
458
+ and stage_col in filtered_hearings.columns
459
+ and len(filtered_hearings) > 0
460
+ ):
461
  stage_counts = filtered_hearings[stage_col].value_counts().reset_index()
462
  stage_counts.columns = ["Stage", "Count"]
463
 
 
494
  not_adjourned = total_hearings - adjourned
495
 
496
  outcome_df = pd.DataFrame(
497
+ {
498
+ "Outcome": ["ADJOURNED", "NOT ADJOURNED"],
499
+ "Count": [adjourned, not_adjourned],
500
+ }
501
  )
502
 
503
  fig_pie = px.pie(
 
506
  names="Outcome",
507
  title=f"Outcome Distribution (Total: {total_hearings:,})",
508
  color="Outcome",
509
+ color_discrete_map={
510
+ "ADJOURNED": "#ef4444",
511
+ "NOT ADJOURNED": "#22c55e",
512
+ },
513
  )
514
  fig_pie.update_layout(height=400)
515
  st.plotly_chart(fig_pie, use_container_width=True)
 
518
  st.markdown("**By Stage**")
519
  adj_by_stage = (
520
  filtered_hearings.groupby(stage_col)["Outcome"]
521
+ .apply(
522
+ lambda x: (x == "ADJOURNED").sum() / len(x) if len(x) > 0 else 0
523
+ )
524
  .reset_index()
525
  )
526
  adj_by_stage.columns = ["Stage", "Rate"]
 
544
  with sub_tab4:
545
  st.markdown("#### Raw Data")
546
 
547
+ data_view = st.radio(
548
+ "Select data to view:", ["Cases", "Hearings"], horizontal=True
549
+ )
550
 
551
  if data_view == "Cases":
552
  st.dataframe(
 
555
  height=600,
556
  )
557
 
558
+ st.markdown(
559
+ f"**Showing first 500 of {len(filtered_cases):,} filtered cases**"
560
+ )
561
 
562
  # Download button
563
  csv = filtered_cases.to_csv(index=False).encode("utf-8")
 
574
  height=600,
575
  )
576
 
577
+ st.markdown(
578
+ f"**Showing first 500 of {len(filtered_hearings):,} filtered hearings**"
579
+ )
580
 
581
  # Download button
582
  csv = filtered_hearings.to_csv(index=False).encode("utf-8")
 
602
  st.markdown("#### Case Types")
603
  if "case_types" in params and params["case_types"]:
604
  case_types_df = pd.DataFrame(
605
+ {
606
+ "Case Type": params["case_types"],
607
+ "Index": range(len(params["case_types"])),
608
+ }
609
  )
610
  st.dataframe(case_types_df, use_container_width=True, hide_index=True)
611
  st.caption(f"Total: {len(params['case_types'])} case types")
 
640
  with st.expander(f"From: {stage}"):
641
  trans_df = pd.DataFrame(transitions)
642
  if not trans_df.empty:
643
+ st.dataframe(
644
+ trans_df, use_container_width=True, hide_index=True
645
+ )
646
 
647
+ st.caption(
648
+ f"Total: {len(params['stage_graph'])} stages with transition data"
649
+ )
650
  else:
651
  st.info("No stage transition data found")
652
 
 
659
 
660
  # Create heatmap
661
  adj_stats = params["adjournment_stats"]
662
+ stages_list = list(adj_stats.keys())[
663
+ :20
664
+ ] # Limit to 20 stages for readability
665
+ case_types_list = params.get("case_types", [])[
666
+ :15
667
+ ] # Limit to 15 case types
668
 
669
  if stages_list and case_types_list:
670
  heatmap_data = []
 
710
  """)
711
 
712
  config_tab1, config_tab2, config_tab3, config_tab4 = st.tabs(
713
+ [
714
+ "EDA Parameters",
715
+ "Ripeness Classifier",
716
+ "Case Generator",
717
+ "Simulation Defaults",
718
+ ]
719
  )
720
 
721
  with config_tab1:
 
916
  from scheduler.data.config import MONTHLY_SEASONALITY
917
 
918
  season_df = pd.DataFrame(
919
+ [
920
+ {"Month": i, "Factor": MONTHLY_SEASONALITY.get(i, 1.0)}
921
+ for i in range(1, 13)
922
+ ]
923
  )
924
  st.dataframe(season_df, use_container_width=True, hide_index=True)
925
  st.caption("1.0 = average, >1.0 = more cases, <1.0 = fewer cases")
 
962
  """,
963
  language="text",
964
  )
965
+ st.caption(
966
+ "Early ADMISSION: 40% bottleneck, Advanced stages: mostly ripe"
967
+ )
968
 
969
  with config_tab4:
970
  st.markdown("#### Simulation Defaults")
 
994
  st.markdown("**Courtroom Capacity**")
995
  if params and "court_capacity_global" in params:
996
  cap = params["court_capacity_global"]
997
+ st.metric(
998
+ "Median slots/day", f"{cap.get('slots_median_global', 151):.0f}"
999
+ )
1000
+ st.metric(
1001
+ "P90 slots/day", f"{cap.get('slots_p90_global', 200):.0f}"
1002
+ )
1003
  else:
1004
  st.info("Run EDA to load capacity statistics")
1005
 
scheduler/dashboard/pages/2_Ripeness_Classifier.py CHANGED
@@ -99,7 +99,9 @@ RipenessClassifier.set_thresholds(
99
  )
100
 
101
  # Main content
102
- tab1, tab2, tab3 = st.tabs(["Current Configuration", "Interactive Testing", "Batch Classification"])
 
 
103
 
104
  with tab1:
105
  st.markdown("### Current Classifier Configuration")
@@ -153,7 +155,10 @@ with tab1:
153
  stage_rules = {
154
  "PRE-TRIAL": {"min_days": 60, "keywords": ["affidavit filed", "reply filed"]},
155
  "TRIAL": {"min_days": 45, "keywords": ["evidence complete", "cross complete"]},
156
- "POST-TRIAL": {"min_days": 30, "keywords": ["arguments complete", "written note"]},
 
 
 
157
  "FINAL DISPOSAL": {"min_days": 15, "keywords": ["disposed", "judgment"]},
158
  }
159
 
@@ -190,8 +195,12 @@ with tab2:
190
  service_hearings_count = st.number_input(
191
  "Service Hearings", min_value=0, max_value=20, value=3
192
  )
193
- days_in_stage = st.number_input("Days in Stage", min_value=0, max_value=365, value=45)
194
- case_age = st.number_input("Case Age (days)", min_value=0, max_value=3650, value=120)
 
 
 
 
195
 
196
  # Keywords
197
  has_keywords = st.multiselect(
@@ -213,7 +222,7 @@ with tab2:
213
 
214
  test_case = Case(
215
  case_id=case_id,
216
- case_type=case_type, # Use string directly instead of CaseType enum
217
  filed_date=filed_date,
218
  current_stage=case_stage,
219
  status=CaseStatus.PENDING,
@@ -286,15 +295,25 @@ with tab3:
286
 
287
  with col1:
288
  pct = classifications["RIPE"] / len(cases) * 100
289
- st.metric("RIPE Cases", f"{classifications['RIPE']:,}", f"{pct:.1f}%")
 
 
290
 
291
  with col2:
292
  pct = classifications["UNKNOWN"] / len(cases) * 100
293
- st.metric("UNKNOWN Cases", f"{classifications['UNKNOWN']:,}", f"{pct:.1f}%")
 
 
 
 
294
 
295
  with col3:
296
  pct = classifications["UNRIPE"] / len(cases) * 100
297
- st.metric("UNRIPE Cases", f"{classifications['UNRIPE']:,}", f"{pct:.1f}%")
 
 
 
 
298
 
299
  # Pie chart
300
  fig = px.pie(
@@ -302,7 +321,11 @@ with tab3:
302
  names=list(classifications.keys()),
303
  title="Classification Distribution",
304
  color=list(classifications.keys()),
305
- color_discrete_map={"RIPE": "green", "UNKNOWN": "orange", "UNRIPE": "red"},
 
 
 
 
306
  )
307
  st.plotly_chart(fig, use_container_width=True)
308
 
@@ -311,4 +334,6 @@ with tab3:
311
 
312
  # Footer
313
  st.markdown("---")
314
- st.markdown("*Adjust thresholds in the sidebar to see real-time impact on classification*")
 
 
 
99
  )
100
 
101
  # Main content
102
+ tab1, tab2, tab3 = st.tabs(
103
+ ["Current Configuration", "Interactive Testing", "Batch Classification"]
104
+ )
105
 
106
  with tab1:
107
  st.markdown("### Current Classifier Configuration")
 
155
  stage_rules = {
156
  "PRE-TRIAL": {"min_days": 60, "keywords": ["affidavit filed", "reply filed"]},
157
  "TRIAL": {"min_days": 45, "keywords": ["evidence complete", "cross complete"]},
158
+ "POST-TRIAL": {
159
+ "min_days": 30,
160
+ "keywords": ["arguments complete", "written note"],
161
+ },
162
  "FINAL DISPOSAL": {"min_days": 15, "keywords": ["disposed", "judgment"]},
163
  }
164
 
 
195
  service_hearings_count = st.number_input(
196
  "Service Hearings", min_value=0, max_value=20, value=3
197
  )
198
+ days_in_stage = st.number_input(
199
+ "Days in Stage", min_value=0, max_value=365, value=45
200
+ )
201
+ case_age = st.number_input(
202
+ "Case Age (days)", min_value=0, max_value=3650, value=120
203
+ )
204
 
205
  # Keywords
206
  has_keywords = st.multiselect(
 
222
 
223
  test_case = Case(
224
  case_id=case_id,
225
+ case_type=case_type,
226
  filed_date=filed_date,
227
  current_stage=case_stage,
228
  status=CaseStatus.PENDING,
 
295
 
296
  with col1:
297
  pct = classifications["RIPE"] / len(cases) * 100
298
+ st.metric(
299
+ "RIPE Cases", f"{classifications['RIPE']:,}", f"{pct:.1f}%"
300
+ )
301
 
302
  with col2:
303
  pct = classifications["UNKNOWN"] / len(cases) * 100
304
+ st.metric(
305
+ "UNKNOWN Cases",
306
+ f"{classifications['UNKNOWN']:,}",
307
+ f"{pct:.1f}%",
308
+ )
309
 
310
  with col3:
311
  pct = classifications["UNRIPE"] / len(cases) * 100
312
+ st.metric(
313
+ "UNRIPE Cases",
314
+ f"{classifications['UNRIPE']:,}",
315
+ f"{pct:.1f}%",
316
+ )
317
 
318
  # Pie chart
319
  fig = px.pie(
 
321
  names=list(classifications.keys()),
322
  title="Classification Distribution",
323
  color=list(classifications.keys()),
324
+ color_discrete_map={
325
+ "RIPE": "green",
326
+ "UNKNOWN": "orange",
327
+ "UNRIPE": "red",
328
+ },
329
  )
330
  st.plotly_chart(fig, use_container_width=True)
331
 
 
334
 
335
  # Footer
336
  st.markdown("---")
337
+ st.markdown(
338
+ "*Adjust thresholds in the sidebar to see real-time impact on classification*"
339
+ )