Spaces:

buckeyeguy
/

osc-usage-dashboard

Sleeping

App Files Files Community

buckeyeguy committed on Apr 23

Commit

ecc00b8

verified ·

1 Parent(s): 53fe9eb

Consolidate dashboard to single app.py

Browse files

Files changed (10) hide show

.ruff_cache/.gitignore +2 -0
.ruff_cache/0.15.2/10572574500376801884 +0 -0
.ruff_cache/0.15.2/11548578324518120789 +0 -0
.ruff_cache/CACHEDIR.TAG +1 -0
__pycache__/app.cpython-312.pyc +0 -0
__pycache__/charts.cpython-312.pyc +0 -0
__pycache__/components.cpython-312.pyc +0 -0
__pycache__/config.cpython-312.pyc +0 -0
__pycache__/data_loader.cpython-312.pyc +0 -0
app.py +252 -284

.ruff_cache/.gitignore ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ # Automatically created by ruff.
2	+ *

.ruff_cache/0.15.2/10572574500376801884 ADDED Viewed

Binary file (197 Bytes). View file

.ruff_cache/0.15.2/11548578324518120789 ADDED Viewed

Binary file (62 Bytes). View file

.ruff_cache/CACHEDIR.TAG ADDED Viewed

	@@ -0,0 +1 @@


1	+ Signature: 8a477f597d28d172789f06886806bc55

__pycache__/app.cpython-312.pyc ADDED Viewed

Binary file (13.1 kB). View file

__pycache__/charts.cpython-312.pyc ADDED Viewed

Binary file (7.23 kB). View file

__pycache__/components.cpython-312.pyc ADDED Viewed

Binary file (710 Bytes). View file

__pycache__/config.cpython-312.pyc ADDED Viewed

Binary file (625 Bytes). View file

__pycache__/data_loader.cpython-312.pyc ADDED Viewed

Binary file (2.08 kB). View file

app.py CHANGED Viewed

@@ -1,363 +1,331 @@
-"""OSC Usage Dashboard — Streamlit app with Plotly charts, organized in tabs."""
 from __future__ import annotations
 from datetime import date, datetime, timedelta
 import streamlit as st
-from charts import (
-    chart_budget_gauge,
-    chart_burn_rate,
-    chart_daily_usage,
-    chart_dollars_by_user,
-    chart_duration_distribution,
-    chart_efficiency_scatter,
-    chart_job_outcomes,
-    chart_launch_method_count,
-    chart_launch_method_dollars,
-    chart_outcome_breakdown,
-    chart_queue_efficiency,
-    chart_resource_sizing,
-    chart_spend_by_outcome,
-    chart_usage_by_system,
-)
-from config import ALLOCATIONS, INTERACTIVE_METHODS, PROJECT_CODES
-from data_loader import filter_jobs, load_data
 st.set_page_config(page_title="OSC Usage Dashboard", layout="wide")
-# --- Load data ---
 jobs, snapshots, metadata = load_data()
-# --- Sidebar ---
 with st.sidebar:
     st.title("OSC Usage Dashboard")
-    # Freshness badge
     pushed_at = metadata.get("pushed_at", "")
     if pushed_at:
-        pushed_dt = datetime.fromisoformat(pushed_at)
-        age = datetime.now() - pushed_dt
         if age > timedelta(hours=24):
-            st.warning(f"Data is {age.days}d {age.seconds // 3600}h old")
         else:
             st.success(f"Updated {pushed_at[:16]}")
-    else:
-        st.info("No timestamp in metadata")
     if st.button("Reload Data"):
         st.cache_data.clear()
         st.rerun()
     st.divider()
-    # Date range
     all_dates = jobs["end_date"].dropna()
-    if not all_dates.empty:
-        min_date = all_dates.min()
-        max_date = all_dates.max()
-    else:
-        min_date = date(2024, 7, 1)
-        max_date = date.today()
     date_range = st.date_input(
-        "Date Range",
-        value=(min_date, max_date),
-        min_value=min_date,
-        max_value=max_date,
     )
-    if isinstance(date_range, tuple) and len(date_range) == 2:
-        date_filter = date_range
-    else:
-        date_filter = (min_date, max_date)
-    # Project filter
-    all_projects = sorted(jobs["project_code"].dropna().unique().tolist())
-    selected_projects = st.multiselect("Projects", all_projects, default=all_projects)
-    # User filter
-    all_users = sorted(jobs["username"].dropna().unique().tolist())
-    selected_users = st.multiselect("Users", all_users, default=all_users)
-    # System filter
-    all_systems = sorted(jobs["system_code"].dropna().unique().tolist())
-    selected_systems = st.multiselect("Systems", all_systems, default=all_systems)
-# --- Apply filters ---
-filtered = filter_jobs(
-    jobs,
-    date_range=date_filter,
-    projects=selected_projects,
-    users=selected_users,
-    systems=selected_systems,
-)
-# --- Metric cards (always visible above tabs) ---
 total_spend = filtered["dollars_used"].sum()
-total_jobs = len(filtered)
-# Batch completion %
-is_batch = ~filtered["launch_method"].isin(INTERACTIVE_METHODS)
-batch_jobs = filtered[is_batch]
-batch_total = len(batch_jobs)
-batch_completed = (batch_jobs["last_state"] == "COMPLETED").sum()
-batch_completion_pct = batch_completed / batch_total * 100 if batch_total > 0 else 0
-# Interactive spend %
-interactive_dollars = filtered[filtered["launch_method"].isin(INTERACTIVE_METHODS)][
-    "dollars_used"
 ].sum()
-interactive_pct = interactive_dollars / total_spend * 100 if total_spend > 0 else 0
 m1, m2, m3, m4 = st.columns(4)
-m1.metric("Total Spend", f"${total_spend:,.2f}", help="Sum of all job costs in the filtered period")
-m2.metric("Total Jobs", f"{total_jobs:,}", help="Number of jobs in the filtered period")
-m3.metric(
-    "Batch Completion %",
-    f"{batch_completion_pct:.1f}%",
-    help="% of batch jobs that completed successfully (interactive sessions excluded — they never exit as COMPLETED)",
-)
 m4.metric(
-    "Interactive Spend %",
-    f"{interactive_pct:.1f}%",
-    help="% of total dollars spent on interactive sessions (Jupyter, Desktop, Code Server, etc.)",
 )
 st.divider()
-# --- 5 tabs ---
 tab_overview, tab_spend, tab_health, tab_user, tab_data = st.tabs(
     ["Overview", "Spend Analysis", "Job Health", "User Detail", "Raw Data"]
 )
-# === Overview tab ===
 with tab_overview:
-    # Budget gauges per project
-    gauge_cols = st.columns(len(PROJECT_CODES))
-    for col, proj in zip(gauge_cols, PROJECT_CODES):
         with col:
-            proj_spend = filtered.loc[filtered["project_code"] == proj, "dollars_used"].sum()
             alloc = ALLOCATIONS.get(proj, 0)
             if alloc > 0:
-                fig = chart_budget_gauge(proj, proj_spend, alloc)
                 st.plotly_chart(fig, use_container_width=True)
-            else:
-                st.metric(proj, f"${proj_spend:,.2f}", help="No allocation data")
-    # Per-project balance from snapshots
-    latest_snapshots = snapshots.sort_values("snapshot_date").groupby("project_code").last()
-    snap_cols = st.columns(len(PROJECT_CODES))
-    for col, proj in zip(snap_cols, PROJECT_CODES):
         with col:
-            if proj in latest_snapshots.index:
-                row = latest_snapshots.loc[proj]
-                balance = row.get("current_balance", None)
-                balance_str = f"${balance:,.2f}" if balance is not None else "N/A"
-                proj_spend = filtered.loc[filtered["project_code"] == proj, "dollars_used"].sum()
                 st.metric(
                     f"{proj} Balance",
-                    balance_str,
-                    delta=f"-${proj_spend:,.2f} spent",
                     delta_color="inverse",
                 )
-    # Burn rate (full width)
-    fig = chart_burn_rate(filtered)
-    if fig:
         st.plotly_chart(fig, use_container_width=True)
-# === Spend Analysis tab ===
 with tab_spend:
     left, right = st.columns(2)
     with left:
-        fig = chart_usage_by_system(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
     with right:
-        fig = chart_dollars_by_user(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-    left2, right2 = st.columns(2)
-    with left2:
-        fig = chart_launch_method_dollars(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-    with right2:
-        fig = chart_launch_method_count(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-    # Daily usage (full width with range slider)
-    fig = chart_daily_usage(filtered)
-    if fig:
-        st.plotly_chart(fig, use_container_width=True)
-# === Job Health tab ===
 with tab_health:
     left, right = st.columns(2)
     with left:
-        fig = chart_job_outcomes(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
     with right:
-        fig = chart_spend_by_outcome(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-    left2, right2 = st.columns(2)
-    with left2:
-        fig = chart_outcome_breakdown(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-    with right2:
-        fig = chart_efficiency_scatter(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-    left3, right3 = st.columns(2)
-    with left3:
-        fig = chart_queue_efficiency(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-    with right3:
-        fig = chart_duration_distribution(filtered)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-    # Resource sizing (full width)
-    fig = chart_resource_sizing(filtered)
-    if fig:
-        st.plotly_chart(fig, use_container_width=True)
-# === User Detail tab ===
 with tab_user:
-    users_in_data = sorted(filtered["username"].dropna().unique().tolist())
     if not users_in_data:
         st.info("No users in filtered data.")
     else:
-        selected_user = st.selectbox("Select User", users_in_data)
-        user_df = filtered[filtered["username"] == selected_user]
-        # User metric cards
-        u_spend = user_df["dollars_used"].sum()
-        u_jobs = len(user_df)
-        u_batch = user_df[~user_df["launch_method"].isin(INTERACTIVE_METHODS)]
-        u_batch_total = len(u_batch)
-        u_batch_completed = (u_batch["last_state"] == "COMPLETED").sum()
-        u_batch_pct = u_batch_completed / u_batch_total * 100 if u_batch_total > 0 else 0
-        um1, um2, um3 = st.columns(3)
-        um1.metric("User Spend", f"${u_spend:,.2f}")
-        um2.metric("User Jobs", f"{u_jobs:,}")
-        um3.metric("Batch Completion %", f"{u_batch_pct:.1f}%")
-        # User charts
         left, right = st.columns(2)
         with left:
-            fig = chart_outcome_breakdown(user_df)
-            if fig:
-                st.plotly_chart(fig, use_container_width=True)
-        with right:
-            fig = chart_efficiency_scatter(user_df)
-            if fig:
-                st.plotly_chart(fig, use_container_width=True)
-        left2, right2 = st.columns(2)
-        with left2:
-            fig = chart_launch_method_dollars(user_df)
-            if fig:
-                st.plotly_chart(fig, use_container_width=True)
-        with right2:
-            fig = chart_resource_sizing(user_df)
-            if fig:
-                st.plotly_chart(fig, use_container_width=True)
-        # Daily usage (full width)
-        fig = chart_daily_usage(user_df)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-        # Duration distribution (full width)
-        fig = chart_duration_distribution(user_df)
-        if fig:
-            st.plotly_chart(fig, use_container_width=True)
-        # User job table
-        st.subheader(f"{selected_user}'s Jobs ({u_jobs:,} rows)")
-        display_cols = [
-            c
-            for c in [
-                "job_id",
-                "project_code",
-                "system_code",
-                "queue_name",
-                "launch_method",
-                "last_state",
-                "outcome_category",
-                "walltime_hours",
-                "dollars_used",
-                "end_time",
-            ]
-            if c in user_df.columns
-        ]
-        user_display = user_df[display_cols].sort_values("end_time", ascending=False)
-        col_config = {}
-        if "dollars_used" in user_display.columns:
-            col_config["dollars_used"] = st.column_config.NumberColumn("Cost ($)", format="$%.2f")
-        if "walltime_hours" in user_display.columns:
-            col_config["walltime_hours"] = st.column_config.NumberColumn(
-                "Walltime (hrs)", format="%.1f"
             )
-        st.dataframe(
-            user_display, use_container_width=True, column_config=col_config, hide_index=True
         )
-# === Raw Data tab ===
 with tab_data:
     st.subheader(f"Filtered Jobs ({len(filtered):,} rows)")
-    # Format for display
-    display_cols = [
-        c
-        for c in [
-            "job_id",
-            "username",
-            "project_code",
-            "system_code",
-            "queue_name",
-            "launch_method",
-            "last_state",
-            "outcome_category",
-            "walltime_hours",
-            "dollars_used",
-            "submit_time",
-            "start_time",
-            "end_time",
-        ]
-        if c in filtered.columns
-    ]
-    display_df = filtered[display_cols].copy()
-    # Format columns for readability
-    col_config = {}
-    if "dollars_used" in display_df.columns:
-        col_config["dollars_used"] = st.column_config.NumberColumn("Cost ($)", format="$%.2f")
-    if "walltime_hours" in display_df.columns:
-        col_config["walltime_hours"] = st.column_config.NumberColumn(
-            "Walltime (hrs)", format="%.1f"
-        )
-    st.dataframe(display_df, use_container_width=True, column_config=col_config, hide_index=True)
-    # Download button
-    csv = filtered[display_cols].to_csv(index=False)
     st.download_button(
-        label="Download filtered data as CSV",
-        data=csv,
-        file_name="osc_usage_filtered.csv",
-        mime="text/csv",
     )
 st.caption(f"Data from OSCusage CLI | {metadata.get('job_count', '?')} jobs in dataset")

+"""OSC Usage Dashboard."""
 from __future__ import annotations
+import json
 from datetime import date, datetime, timedelta
+from pathlib import Path
+import pandas as pd
+import plotly.express as px
+import plotly.graph_objects as go
 import streamlit as st
+from huggingface_hub import snapshot_download
+DATASET_REPO = "buckeyeguy/osc-usage-data"
+PROJECT_CODES = ["PAS1266", "PAS3209"]
+ALLOCATIONS = {"PAS1266": 2257.0, "PAS3209": 1211.0}
+INTERACTIVE_METHODS = frozenset({"Jupyter", "Desktop", "Code Server", "MATLAB", "MLflow"})
 st.set_page_config(page_title="OSC Usage Dashboard", layout="wide")
+@st.cache_data(ttl=300)
+def load_data():
+    snap = Path(snapshot_download(repo_id=DATASET_REPO, repo_type="dataset"))
+    jobs = pd.read_parquet(snap / "jobs.parquet")
+    snapshots = pd.read_parquet(snap / "snapshots.parquet")
+    metadata = json.loads((snap / "metadata.json").read_text())
+    for col in ["submit_time", "start_time", "end_time"]:
+        if col in jobs.columns:
+            jobs[col] = pd.to_datetime(jobs[col])
+    return jobs, snapshots, metadata
+def chart(df, kind="histogram", **kwargs):
+    if df.empty:
+        return
+    st.plotly_chart(getattr(px, kind)(df, **kwargs), use_container_width=True)
+def agg(df, by, value="dollars_used"):
+    """Sum-by-group stat. Pre-aggregates so we can use px.bar (geom) instead of px.histogram (stat)."""
+    return df.groupby(by, dropna=False)[value].sum().reset_index()
+def daily(df, by):
+    return (
+        df.dropna(subset=["end_date"]).groupby(["end_date", by])["dollars_used"].sum().reset_index()
+    )
+def runtime_vs_cost(df):
+    chart(
+        df[(df["walltime_hours"] > 0) & (df["dollars_used"] > 0)],
+        "scatter",
+        x="walltime_hours",
+        y="dollars_used",
+        color="outcome_category",
+        log_x=True,
+        log_y=True,
+        opacity=0.5,
+        title="Runtime vs Cost",
+    )
+# --- Load + Sidebar ---
 jobs, snapshots, metadata = load_data()
 with st.sidebar:
     st.title("OSC Usage Dashboard")
     pushed_at = metadata.get("pushed_at", "")
     if pushed_at:
+        age = datetime.now() - datetime.fromisoformat(pushed_at)
         if age > timedelta(hours=24):
+            st.warning(f"Data is {age.days}d old")
         else:
             st.success(f"Updated {pushed_at[:16]}")
     if st.button("Reload Data"):
         st.cache_data.clear()
         st.rerun()
     st.divider()
     all_dates = jobs["end_date"].dropna()
+    min_date, max_date = (
+        (all_dates.min(), all_dates.max())
+        if not all_dates.empty
+        else (date(2024, 7, 1), date.today())
+    )
     date_range = st.date_input(
+        "Date Range", value=(min_date, max_date), min_value=min_date, max_value=max_date
     )
+    date_filter = (
+        date_range
+        if isinstance(date_range, tuple) and len(date_range) == 2
+        else (min_date, max_date)
+    )
+    selections = {}
+    for label, col in [
+        ("Projects", "project_code"),
+        ("Users", "username"),
+        ("Systems", "system_code"),
+    ]:
+        opts = sorted(jobs[col].dropna().unique())
+        selections[col] = st.multiselect(label, opts, default=opts)
+filtered = jobs[
+    jobs["end_date"].between(date_filter[0], date_filter[1])
+    & jobs["project_code"].isin(selections["project_code"])
+    & jobs["username"].isin(selections["username"])
+    & jobs["system_code"].isin(selections["system_code"])
+]
+# --- Metric Cards ---
 total_spend = filtered["dollars_used"].sum()
+batch = filtered[~filtered["launch_method"].isin(INTERACTIVE_METHODS)]
+interactive_dollars = filtered.loc[
+    filtered["launch_method"].isin(INTERACTIVE_METHODS), "dollars_used"
 ].sum()
 m1, m2, m3, m4 = st.columns(4)
+m1.metric("Total Spend", f"${total_spend:,.2f}")
+m2.metric("Total Jobs", f"{len(filtered):,}")
+m3.metric("Batch Completion %", f"{(batch['last_state'] == 'COMPLETED').mean() * 100:.1f}%")
 m4.metric(
+    "Interactive Spend %", f"{interactive_dollars / total_spend * 100 if total_spend else 0:.1f}%"
 )
 st.divider()
+# --- Tabs ---
 tab_overview, tab_spend, tab_health, tab_user, tab_data = st.tabs(
     ["Overview", "Spend Analysis", "Job Health", "User Detail", "Raw Data"]
 )
 with tab_overview:
+    for col, proj in zip(st.columns(len(PROJECT_CODES)), PROJECT_CODES):
         with col:
+            ps = filtered.loc[filtered["project_code"] == proj, "dollars_used"].sum()
             alloc = ALLOCATIONS.get(proj, 0)
             if alloc > 0:
+                mx = max(alloc * 1.2, ps)
+                fig = go.Figure(
+                    go.Indicator(
+                        mode="gauge+number",
+                        value=ps,
+                        number={"prefix": "$", "valueformat": ",.0f"},
+                        title={"text": proj},
+                        gauge={
+                            "axis": {"range": [0, mx], "tickprefix": "$"},
+                            "bar": {"color": px.colors.qualitative.Plotly[0]},
+                            "steps": [
+                                {"range": [0, alloc * 0.7], "color": "#D4EDDA"},
+                                {"range": [alloc * 0.7, alloc * 0.9], "color": "#FFF3CD"},
+                                {"range": [alloc * 0.9, mx], "color": "#F8D7DA"},
+                            ],
+                            "threshold": {
+                                "line": {"color": "red", "width": 3},
+                                "thickness": 0.75,
+                                "value": alloc,
+                            },
+                        },
+                    )
+                )
+                fig.update_layout(height=250, margin=dict(t=60, b=20, l=30, r=30))
                 st.plotly_chart(fig, use_container_width=True)
+    latest = snapshots.sort_values("snapshot_date").groupby("project_code").last()
+    for col, proj in zip(st.columns(len(PROJECT_CODES)), PROJECT_CODES):
         with col:
+            if proj in latest.index:
+                bal = latest.loc[proj].get("current_balance")
+                ps = filtered.loc[filtered["project_code"] == proj, "dollars_used"].sum()
                 st.metric(
                     f"{proj} Balance",
+                    f"${bal:,.2f}" if bal is not None else "N/A",
+                    delta=f"-${ps:,.2f} spent",
                     delta_color="inverse",
                 )
+    burn = daily(filtered, "project_code")
+    burn["cumulative"] = burn.groupby("project_code")["dollars_used"].cumsum()
+    if not burn.empty:
+        fig = px.area(
+            burn, x="end_date", y="cumulative", color="project_code", title="Budget Burn Rate"
+        )
+        fig.update_yaxes(tickprefix="$")
+        for proj, alloc in ALLOCATIONS.items():
+            fig.add_hline(y=alloc, line_dash="dot", annotation_text=f"{proj}: ${alloc:,.0f}")
         st.plotly_chart(fig, use_container_width=True)
 with tab_spend:
     left, right = st.columns(2)
     with left:
+        chart(
+            agg(filtered, ["system_code", "subtype_code"]),
+            "bar",
+            x="system_code",
+            y="dollars_used",
+            color="subtype_code",
+            barmode="group",
+            title="Usage by System",
+        )
     with right:
+        chart(filtered, "pie", names="username", values="dollars_used", title="Dollars by User")
+    left, right = st.columns(2)
+    with left:
+        chart(
+            agg(filtered, ["project_code", "launch_method"]),
+            "bar",
+            x="project_code",
+            y="dollars_used",
+            color="launch_method",
+            title="Spend by Launch Method",
+        )
+    with right:
+        chart(
+            filtered,
+            "histogram",
+            x="project_code",
+            color="launch_method",
+            barmode="stack",
+            title="Jobs by Launch Method",
+        )
+    chart(
+        daily(filtered, "system_code"),
+        "line",
+        x="end_date",
+        y="dollars_used",
+        color="system_code",
+        markers=True,
+        title="Daily Usage",
+    )
 with tab_health:
     left, right = st.columns(2)
     with left:
+        chart(
+            filtered.dropna(subset=["end_month"]),
+            "histogram",
+            x="end_month",
+            color="last_state",
+            barmode="stack",
+            title="Job Outcomes by Month",
+        )
     with right:
+        chart(
+            agg(filtered, ["outcome_category", "project_code"]),
+            "bar",
+            x="outcome_category",
+            y="dollars_used",
+            color="project_code",
+            barmode="group",
+            title="Spend by Outcome",
+        )
+    queue_cost = (
+        filtered.groupby("queue_name")
+        .agg(n=("job_id", "count"), avg_cost=("dollars_used", "mean"))
+        .reset_index()
+        .query("n >= 10")
+        .sort_values("avg_cost", ascending=False)
+    )
+    if not queue_cost.empty:
+        chart(
+            queue_cost,
+            "bar",
+            x="queue_name",
+            y="avg_cost",
+            text="n",
+            title="Avg Cost per Job by Queue (n≥10)",
+        )
+    left, right = st.columns(2)
+    with left:
+        chart(
+            filtered[filtered["walltime_hours"] > 0],
+            "histogram",
+            x="walltime_hours",
+            color="outcome_category",
+            nbins=30,
+            title="Duration Distribution",
+        )
+    with right:
+        runtime_vs_cost(filtered)
 with tab_user:
+    users_in_data = sorted(filtered["username"].dropna().unique())
     if not users_in_data:
         st.info("No users in filtered data.")
     else:
+        user = st.selectbox("Select User", users_in_data)
+        udf = filtered[filtered["username"] == user]
+        ub = udf[~udf["launch_method"].isin(INTERACTIVE_METHODS)]
+        m1, m2, m3 = st.columns(3)
+        m1.metric("Spend", f"${udf['dollars_used'].sum():,.2f}")
+        m2.metric("Jobs", f"{len(udf):,}")
+        m3.metric(
+            "Batch Completion %",
+            f"{(ub['last_state'] == 'COMPLETED').mean() * 100:.1f}%" if len(ub) else "N/A",
+        )
         left, right = st.columns(2)
         with left:
+            chart(
+                agg(udf, ["launch_method", "outcome_category"]),
+                "bar",
+                x="launch_method",
+                y="dollars_used",
+                color="outcome_category",
+                title="Spend by Method & Outcome",
             )
+        with right:
+            runtime_vs_cost(udf)
+        chart(
+            daily(udf, "system_code"),
+            "line",
+            x="end_date",
+            y="dollars_used",
+            color="system_code",
+            markers=True,
+            title="Daily Usage",
         )
 with tab_data:
     st.subheader(f"Filtered Jobs ({len(filtered):,} rows)")
+    st.dataframe(filtered, use_container_width=True, hide_index=True)
     st.download_button(
+        "Download CSV", filtered.to_csv(index=False), "osc_usage_filtered.csv", "text/csv"
     )
 st.caption(f"Data from OSCusage CLI | {metadata.get('job_count', '?')} jobs in dataset")