Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -3,7 +3,7 @@ import pandas as pd
|
|
| 3 |
import plotly.express as px
|
| 4 |
import plotly.graph_objects as go
|
| 5 |
import numpy as np
|
| 6 |
-
from datetime import datetime
|
| 7 |
|
| 8 |
# 1. PAGE CONFIGURATION
|
| 9 |
st.set_page_config(
|
|
@@ -13,350 +13,245 @@ st.set_page_config(
|
|
| 13 |
initial_sidebar_state="expanded"
|
| 14 |
)
|
| 15 |
|
| 16 |
-
# 2. PROFESSIONAL STYLING (
|
| 17 |
st.markdown("""
|
| 18 |
<style>
|
| 19 |
-
@import url('https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700&display=swap');
|
|
|
|
| 20 |
|
| 21 |
-
.stApp {
|
| 22 |
-
background-color: #f8fafc;
|
| 23 |
-
color: #0f172a;
|
| 24 |
-
font-family: 'Inter', sans-serif;
|
| 25 |
-
}
|
| 26 |
-
|
| 27 |
/* METRIC CARDS */
|
| 28 |
div[data-testid="stMetric"] {
|
| 29 |
-
background
|
| 30 |
-
border: 1px solid #e2e8f0;
|
| 31 |
-
|
| 32 |
-
padding: 15px;
|
| 33 |
-
box-shadow: 0 4px 6px -1px rgba(0, 0, 0, 0.1);
|
| 34 |
-
}
|
| 35 |
-
div[data-testid="stMetricValue"] {
|
| 36 |
-
color: #0f172a !important;
|
| 37 |
-
font-weight: 700 !important;
|
| 38 |
}
|
| 39 |
-
div[data-testid="
|
| 40 |
-
|
| 41 |
-
}
|
| 42 |
-
|
| 43 |
/* DATAFRAME */
|
| 44 |
-
div[data-testid="stDataFrame"]
|
| 45 |
-
|
| 46 |
-
background
|
| 47 |
-
|
| 48 |
-
div[data-testid="stDataFrame"] div[role="columnheader"] {
|
| 49 |
-
color: #0f172a !important;
|
| 50 |
-
font-weight: 600 !important;
|
| 51 |
-
background-color: #f1f5f9 !important;
|
| 52 |
}
|
| 53 |
-
|
| 54 |
/* SIDEBAR */
|
| 55 |
-
[data-testid="stSidebar"] {
|
| 56 |
-
|
| 57 |
-
}
|
| 58 |
-
[data-testid="stSidebar"] * {
|
| 59 |
-
color: #f8fafc !important;
|
| 60 |
-
}
|
| 61 |
-
[data-testid="stSidebar"] .stSelectbox label,
|
| 62 |
-
[data-testid="stSidebar"] .stMultiSelect label {
|
| 63 |
-
color: #94a3b8 !important;
|
| 64 |
-
}
|
| 65 |
-
|
| 66 |
-
h1, h2, h3 { color: #0f172a !important; font-weight: 700 !important; }
|
| 67 |
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
font-weight: 600;
|
| 75 |
-
}
|
| 76 |
-
.bg-red { background-color: #fee2e2; color: #991b1b; }
|
| 77 |
-
.bg-green { background-color: #dcfce7; color: #166534; }
|
| 78 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 79 |
.js-plotly-plot .plotly .main-svg { background-color: rgba(0,0,0,0) !important; }
|
| 80 |
</style>
|
| 81 |
""", unsafe_allow_html=True)
|
| 82 |
|
| 83 |
-
# 3.
|
| 84 |
-
@st.cache_data
|
| 85 |
def load_data():
|
| 86 |
try:
|
| 87 |
df = pd.read_csv('analyzed_aadhaar_data.csv')
|
|
|
|
| 88 |
except FileNotFoundError:
|
| 89 |
-
|
| 90 |
-
|
| 91 |
-
districts = ['North District', 'South Region', 'East Zone', 'West End', 'Central Hub',
|
| 92 |
-
|
| 93 |
df = pd.DataFrame({
|
| 94 |
-
'date': dates,
|
| 95 |
-
'state': np.random.choice([
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
'
|
| 101 |
-
'
|
| 102 |
-
'
|
|
|
|
|
|
|
|
|
|
|
|
|
| 103 |
})
|
| 104 |
|
| 105 |
-
if 'date' in df.columns:
|
| 106 |
-
df['date'] = pd.to_datetime(df['date'])
|
| 107 |
|
| 108 |
-
#
|
| 109 |
state_centers = {
|
| 110 |
-
'Andaman and Nicobar Islands': (11.7401, 92.6586),
|
| 111 |
-
'
|
| 112 |
-
'
|
| 113 |
-
'
|
| 114 |
-
'
|
| 115 |
-
'
|
| 116 |
-
'
|
| 117 |
-
'
|
| 118 |
-
'
|
| 119 |
-
'
|
| 120 |
-
'
|
| 121 |
-
'
|
| 122 |
-
'Himachal Pradesh': (31.9579, 77.1095), # Corrected
|
| 123 |
-
'Jammu and Kashmir': (33.7782, 76.5762),
|
| 124 |
-
'Jharkhand': (23.6102, 85.2799),
|
| 125 |
-
'Karnataka': (15.3173, 75.7139),
|
| 126 |
-
'Kerala': (10.8505, 76.2711),
|
| 127 |
-
'Ladakh': (34.1526, 77.5770),
|
| 128 |
-
'Lakshadweep': (10.5667, 72.6417),
|
| 129 |
-
'Madhya Pradesh': (22.9734, 78.6569),
|
| 130 |
-
'Maharashtra': (19.7515, 75.7139),
|
| 131 |
-
'Manipur': (24.6637, 93.9063),
|
| 132 |
-
'Meghalaya': (25.4670, 91.3662),
|
| 133 |
-
'Mizoram': (23.1645, 92.9376),
|
| 134 |
-
'Nagaland': (26.1584, 94.5624),
|
| 135 |
-
'Odisha': (20.9517, 85.0985),
|
| 136 |
-
'Puducherry': (11.9416, 79.8083),
|
| 137 |
-
'Punjab': (31.1471, 75.3412),
|
| 138 |
-
'Rajasthan': (27.0238, 74.2179),
|
| 139 |
-
'Sikkim': (27.5330, 88.5122),
|
| 140 |
-
'Tamil Nadu': (11.1271, 78.6569),
|
| 141 |
-
'Telangana': (18.1124, 79.0193),
|
| 142 |
-
'Tripura': (23.9408, 91.9882),
|
| 143 |
-
'Uttar Pradesh': (26.8467, 80.9462),
|
| 144 |
-
'Uttarakhand': (30.0668, 79.0193),
|
| 145 |
-
'West Bengal': (22.9868, 87.8550)
|
| 146 |
}
|
| 147 |
|
| 148 |
-
#
|
| 149 |
-
# format: (lat_spread, lon_spread) in degrees
|
| 150 |
-
# This prevents "Thin" states from spilling into the ocean/neighbors
|
| 151 |
state_spreads = {
|
| 152 |
-
'Kerala': (1.2, 0.25),
|
| 153 |
-
'
|
| 154 |
-
'
|
| 155 |
-
'
|
| 156 |
-
'
|
| 157 |
-
'
|
| 158 |
-
'
|
| 159 |
-
'
|
| 160 |
-
'
|
| 161 |
-
'Gujarat': (1.0, 1.3),
|
| 162 |
-
'Rajasthan': (1.8, 1.8),
|
| 163 |
-
'Madhya Pradesh': (1.5, 2.0),
|
| 164 |
-
'Andaman and Nicobar Islands': (1.5, 0.2), # Archipelago (Tall)
|
| 165 |
-
'Himachal Pradesh': (0.5, 0.6)
|
| 166 |
}
|
| 167 |
|
| 168 |
-
default_spread = (0.6, 0.6)
|
| 169 |
-
|
| 170 |
def get_coords(row):
|
| 171 |
state = row.get('state', 'Delhi')
|
| 172 |
-
district = str(row.get('district', 'Unknown'))
|
| 173 |
-
|
| 174 |
base_lat, base_lon = state_centers.get(state, (20.5937, 78.9629))
|
| 175 |
-
lat_scale, lon_scale = state_spreads.get(state, default_spread)
|
| 176 |
-
|
| 177 |
-
# --- 3. SEMANTIC OFFSETTING ---
|
| 178 |
-
# If district name contains direction, bias the jitter
|
| 179 |
-
lat_bias, lon_bias = 0, 0
|
| 180 |
-
d_lower = district.lower()
|
| 181 |
-
|
| 182 |
-
# Bias factor (percent of scale)
|
| 183 |
-
bias_factor = 0.7
|
| 184 |
-
|
| 185 |
-
if 'north' in d_lower: lat_bias += lat_scale * bias_factor
|
| 186 |
-
if 'south' in d_lower: lat_bias -= lat_scale * bias_factor
|
| 187 |
-
if 'east' in d_lower: lon_bias += lon_scale * bias_factor
|
| 188 |
-
if 'west' in d_lower: lon_bias -= lon_scale * bias_factor
|
| 189 |
|
| 190 |
-
#
|
| 191 |
-
|
| 192 |
-
np.random.seed(district_hash % 2**32)
|
| 193 |
|
| 194 |
-
|
| 195 |
-
|
| 196 |
|
| 197 |
-
|
| 198 |
-
|
|
|
|
|
|
|
| 199 |
|
| 200 |
-
|
| 201 |
-
|
| 202 |
-
noise = 0.03
|
| 203 |
|
| 204 |
return pd.Series({
|
| 205 |
-
'lat': base_lat + lat_bias +
|
| 206 |
-
'lon': base_lon + lon_bias +
|
| 207 |
})
|
| 208 |
|
| 209 |
coords = df.apply(get_coords, axis=1)
|
| 210 |
-
df['lat'] = coords['lat']
|
| 211 |
-
df['
|
| 212 |
-
|
| 213 |
-
df['risk_category'] = pd.cut(
|
| 214 |
-
df['RISK_SCORE'],
|
| 215 |
-
bins=[-1, 50, 75, 85, 100],
|
| 216 |
-
labels=['Low', 'Medium', 'High', 'Critical']
|
| 217 |
-
)
|
| 218 |
return df
|
| 219 |
|
| 220 |
-
df = load_data()
|
| 221 |
|
| 222 |
# 4. SIDEBAR & FILTERS
|
| 223 |
with st.sidebar:
|
| 224 |
-
st.markdown("### S.T.A.R.K AI Control")
|
| 225 |
st.markdown("---")
|
|
|
|
|
|
|
|
|
|
|
|
|
| 226 |
|
| 227 |
state_list = ['All'] + sorted(df['state'].unique().tolist())
|
| 228 |
-
|
|
|
|
| 229 |
|
| 230 |
-
|
| 231 |
-
|
| 232 |
-
|
| 233 |
-
else:
|
| 234 |
-
filtered_df = df.copy()
|
| 235 |
-
district_list = ['All']
|
| 236 |
-
|
| 237 |
-
selected_district = st.selectbox("Select District", district_list)
|
| 238 |
|
| 239 |
-
if selected_district != 'All':
|
| 240 |
-
filtered_df = filtered_df[filtered_df['district'] == selected_district]
|
| 241 |
-
|
| 242 |
st.markdown("---")
|
| 243 |
-
risk_filter = st.multiselect(
|
| 244 |
-
|
| 245 |
-
options=['Low', 'Medium', 'High', 'Critical'],
|
| 246 |
-
default=['High', 'Critical']
|
| 247 |
-
)
|
| 248 |
-
if risk_filter:
|
| 249 |
-
filtered_df = filtered_df[filtered_df['risk_category'].isin(risk_filter)]
|
| 250 |
|
| 251 |
st.markdown("---")
|
| 252 |
-
st.link_button("Open Notebook
|
| 253 |
-
st.
|
| 254 |
-
st.info(f"**User:** UIDAI_Officer\n\n**Team:** UIDAI_4571")
|
| 255 |
|
| 256 |
-
# 5. HEADER
|
| 257 |
col1, col2 = st.columns([3, 1])
|
| 258 |
with col1:
|
| 259 |
-
st.title("
|
| 260 |
-
st.markdown("Context-Aware Fraud Detection System")
|
| 261 |
with col2:
|
| 262 |
-
st.markdown("""
|
| 263 |
-
<div style="text-align: right; padding-top: 20px;">
|
| 264 |
-
<span class="status-badge bg-green">System Online</span>
|
| 265 |
-
<div style="font-size: 12px; color: #64748b; margin-top: 5px;">Live Monitor</div>
|
| 266 |
-
</div>
|
| 267 |
-
""", unsafe_allow_html=True)
|
| 268 |
|
| 269 |
st.markdown("---")
|
| 270 |
-
|
| 271 |
-
|
| 272 |
-
m1
|
| 273 |
-
|
| 274 |
-
|
| 275 |
-
|
| 276 |
-
|
| 277 |
-
|
| 278 |
-
m1.metric("Total Centers", f"{total_centers:,}", border=True)
|
| 279 |
-
m2.metric("High Risk Alerts", f"{high_risk}", delta="Action Required", delta_color="inverse", border=True)
|
| 280 |
-
m3.metric("Avg. Risk Score", f"{avg_risk:.1f}/100", border=True)
|
| 281 |
-
m4.metric("Weekend Spikes", f"{weekend_alerts}", "Unauthorized", delta_color="off", border=True)
|
| 282 |
-
|
| 283 |
st.markdown("##")
|
| 284 |
|
| 285 |
# 6. TABS
|
| 286 |
-
tab_map, tab_list, tab_charts = st.tabs(["Geographic Risk", "Priority List", "
|
| 287 |
|
| 288 |
with tab_map:
|
| 289 |
-
|
| 290 |
-
with
|
| 291 |
if not filtered_df.empty:
|
| 292 |
-
|
| 293 |
-
|
| 294 |
-
|
| 295 |
-
|
| 296 |
-
|
| 297 |
-
|
| 298 |
-
|
| 299 |
-
|
| 300 |
-
|
| 301 |
-
hover_name="pincode",
|
| 302 |
-
hover_data={"district": True, "state": True, "RISK_SCORE": True, "lat": False, "lon": False},
|
| 303 |
-
mapbox_style="open-street-map",
|
| 304 |
-
height=600,
|
| 305 |
-
title="<b>Live Fraud Risk Heatmap</b>"
|
| 306 |
-
)
|
| 307 |
-
fig_map.update_layout(margin={"r":0,"t":40,"l":0,"b":0})
|
| 308 |
-
st.plotly_chart(fig_map, use_container_width=True)
|
| 309 |
-
else:
|
| 310 |
-
st.warning("No data matches current filters.")
|
| 311 |
-
|
| 312 |
-
with col_details:
|
| 313 |
-
st.subheader("Top Hotspots")
|
| 314 |
if not filtered_df.empty:
|
| 315 |
-
|
| 316 |
-
for
|
| 317 |
-
|
| 318 |
-
st.markdown(f"""
|
| 319 |
-
<div style="background: white; padding: 12px; border-radius: 8px; border-left: 5px solid {color}; margin-bottom: 10px; box-shadow: 0 2px 4px rgba(0,0,0,0.05);">
|
| 320 |
-
<div style="font-weight: 600; color: #1e293b;">{district}</div>
|
| 321 |
-
<div style="font-size: 13px; color: #64748b;">Avg Risk: <b>{score:.1f}</b></div>
|
| 322 |
-
</div>
|
| 323 |
-
""", unsafe_allow_html=True)
|
| 324 |
|
| 325 |
with tab_list:
|
| 326 |
-
st.subheader("
|
| 327 |
-
|
| 328 |
-
|
| 329 |
-
st.
|
| 330 |
-
|
| 331 |
-
column_config={
|
| 332 |
-
"RISK_SCORE": st.column_config.ProgressColumn("Risk Probability", format="%d%%", min_value=0, max_value=100),
|
| 333 |
-
"date": st.column_config.DateColumn("Date", format="DD MMM YYYY"),
|
| 334 |
-
"total_activity": st.column_config.NumberColumn("Volume"),
|
| 335 |
-
"enrol_adult": st.column_config.NumberColumn("Adult Enrols"),
|
| 336 |
-
},
|
| 337 |
-
use_container_width=True, hide_index=True, height=400
|
| 338 |
-
)
|
| 339 |
-
csv = target_list.to_csv(index=False).encode('utf-8')
|
| 340 |
-
st.download_button("Download CSV", data=csv, file_name="uidai_stark_priority_list.csv", mime="text/csv", type="primary")
|
| 341 |
|
| 342 |
with tab_charts:
|
| 343 |
c1, c2 = st.columns(2)
|
| 344 |
with c1:
|
| 345 |
-
st.
|
| 346 |
-
|
| 347 |
-
|
| 348 |
-
|
| 349 |
-
|
| 350 |
-
title="Deviation from District Baseline",
|
| 351 |
-
labels={"ratio_deviation": "Deviation Score", "total_activity": "Daily Transactions"}
|
| 352 |
-
)
|
| 353 |
-
fig_scatter.add_hline(y=0.2, line_dash="dash", line_color="red", annotation_text="Fraud Threshold")
|
| 354 |
-
st.plotly_chart(fig_scatter, use_container_width=True)
|
| 355 |
with c2:
|
| 356 |
-
st.
|
| 357 |
-
|
| 358 |
-
|
| 359 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 360 |
|
| 361 |
st.markdown("---")
|
| 362 |
st.markdown("""<div style="text-align: center; font-size: 13px; color: #94a3b8;"><b>Project S.T.A.R.K AI</b> | UIDAI Hackathon 2026</div>""", unsafe_allow_html=True)
|
|
|
|
| 3 |
import plotly.express as px
|
| 4 |
import plotly.graph_objects as go
|
| 5 |
import numpy as np
|
| 6 |
+
from datetime import datetime, timedelta
|
| 7 |
|
| 8 |
# 1. PAGE CONFIGURATION
|
| 9 |
st.set_page_config(
|
|
|
|
| 13 |
initial_sidebar_state="expanded"
|
| 14 |
)
|
| 15 |
|
| 16 |
+
# 2. ENHANCED PROFESSIONAL STYLING (Optimized)
|
| 17 |
st.markdown("""
|
| 18 |
<style>
|
| 19 |
+
@import url('https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700;800&display=swap');
|
| 20 |
+
.stApp { background: linear-gradient(135deg, #f8fafc 0%, #f1f5f9 100%); color: #0f172a; font-family: 'Inter', sans-serif; }
|
| 21 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 22 |
/* METRIC CARDS */
|
| 23 |
div[data-testid="stMetric"] {
|
| 24 |
+
background: linear-gradient(135deg, #ffffff 0%, #f8fafc 100%);
|
| 25 |
+
border: 1px solid #e2e8f0; border-radius: 12px; padding: 20px;
|
| 26 |
+
box-shadow: 0 4px 6px -1px rgba(0,0,0,0.1); transition: transform 0.2s;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 27 |
}
|
| 28 |
+
div[data-testid="stMetric"]:hover { transform: translateY(-2px); box-shadow: 0 10px 15px -3px rgba(0,0,0,0.1); }
|
| 29 |
+
div[data-testid="stMetricValue"] { color: #0f172a !important; font-weight: 800 !important; font-size: 2rem !important; }
|
| 30 |
+
div[data-testid="stMetricLabel"] { color: #64748b !important; font-weight: 600 !important; text-transform: uppercase; font-size: 0.75rem; letter-spacing: 0.05em; }
|
| 31 |
+
|
| 32 |
/* DATAFRAME */
|
| 33 |
+
div[data-testid="stDataFrame"] { border-radius: 8px; overflow: hidden; box-shadow: 0 1px 3px rgba(0,0,0,0.1); }
|
| 34 |
+
div[data-testid="stDataFrame"] div[role="columnheader"] {
|
| 35 |
+
background: linear-gradient(to bottom, #f8fafc, #f1f5f9) !important;
|
| 36 |
+
color: #0f172a !important; font-weight: 700 !important; border-bottom: 2px solid #cbd5e1 !important;
|
|
|
|
|
|
|
|
|
|
|
|
|
| 37 |
}
|
| 38 |
+
|
| 39 |
/* SIDEBAR */
|
| 40 |
+
[data-testid="stSidebar"] { background: linear-gradient(180deg, #1e293b 0%, #0f172a 100%); border-right: 1px solid #334155; }
|
| 41 |
+
[data-testid="stSidebar"] * { color: #f8fafc !important; }
|
| 42 |
+
[data-testid="stSidebar"] .stSelectbox label { color: #cbd5e1 !important; }
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 43 |
|
| 44 |
+
/* UI ELEMENTS */
|
| 45 |
+
h1 { background: linear-gradient(135deg, #0f172a 0%, #334155 100%); -webkit-background-clip: text; -webkit-text-fill-color: transparent; font-weight: 800 !important; }
|
| 46 |
+
.status-badge { display: inline-flex; align-items: center; padding: 6px 14px; border-radius: 9999px; font-size: 12px; font-weight: 700; text-transform: uppercase; box-shadow: 0 1px 3px rgba(0,0,0,0.1); }
|
| 47 |
+
.bg-red { background: linear-gradient(135deg, #fee2e2 0%, #fecaca 100%); color: #991b1b; }
|
| 48 |
+
.bg-green { background: linear-gradient(135deg, #dcfce7 0%, #bbf7d0 100%); color: #166534; }
|
| 49 |
+
.bg-amber { background: linear-gradient(135deg, #fef3c7 0%, #fde68a 100%); color: #92400e; }
|
|
|
|
|
|
|
|
|
|
|
|
|
| 50 |
|
| 51 |
+
/* TABS & BUTTONS */
|
| 52 |
+
.stTabs [data-baseweb="tab-list"] { gap: 8px; }
|
| 53 |
+
.stTabs [aria-selected="true"] { background: linear-gradient(135deg, #3b82f6 0%, #2563eb 100%); color: white !important; }
|
| 54 |
+
.stButton button { border-radius: 8px; font-weight: 600; }
|
| 55 |
+
|
| 56 |
+
/* HOTSPOTS */
|
| 57 |
+
.hotspot-card { background: white; padding: 16px; border-radius: 10px; border-left: 5px solid; margin-bottom: 12px; box-shadow: 0 2px 4px rgba(0,0,0,0.05); transition: all 0.2s; }
|
| 58 |
+
.hotspot-card:hover { transform: translateX(4px); box-shadow: 0 4px 6px rgba(0,0,0,0.1); }
|
| 59 |
.js-plotly-plot .plotly .main-svg { background-color: rgba(0,0,0,0) !important; }
|
| 60 |
</style>
|
| 61 |
""", unsafe_allow_html=True)
|
| 62 |
|
| 63 |
+
# 3. ENHANCED DATA LOADING
|
| 64 |
+
@st.cache_data(ttl=300)
|
| 65 |
def load_data():
|
| 66 |
try:
|
| 67 |
df = pd.read_csv('analyzed_aadhaar_data.csv')
|
| 68 |
+
st.toast("β
Data loaded successfully", icon="β
")
|
| 69 |
except FileNotFoundError:
|
| 70 |
+
st.toast("π Generating sample data...", icon="βΉοΈ")
|
| 71 |
+
dates = pd.date_range(start="2024-10-01", periods=300, freq='D')
|
| 72 |
+
districts = ['North District', 'South Region', 'East Zone', 'West End', 'Central Hub',
|
| 73 |
+
'Rural A', 'Urban B', 'Coastal District', 'Mountain Region', 'Valley Area']
|
| 74 |
df = pd.DataFrame({
|
| 75 |
+
'date': np.random.choice(dates, 300),
|
| 76 |
+
'state': np.random.choice([
|
| 77 |
+
'Maharashtra', 'Uttar Pradesh', 'Bihar', 'Karnataka', 'Delhi', 'West Bengal',
|
| 78 |
+
'Kerala', 'Assam', 'Rajasthan', 'Gujarat', 'Tamil Nadu', 'Madhya Pradesh',
|
| 79 |
+
'Telangana', 'Punjab', 'Haryana', 'Andhra Pradesh', 'Odisha', 'Chhattisgarh'
|
| 80 |
+
], 300),
|
| 81 |
+
'district': np.random.choice(districts, 300),
|
| 82 |
+
'pincode': np.random.randint(110001, 800000, 300),
|
| 83 |
+
'RISK_SCORE': np.random.beta(2, 5, 300) * 100,
|
| 84 |
+
'total_activity': np.random.gamma(4, 50, 300).astype(int),
|
| 85 |
+
'enrol_adult': np.random.gamma(3, 30, 300).astype(int),
|
| 86 |
+
'ratio_deviation': np.random.normal(0, 0.2, 300),
|
| 87 |
+
'is_weekend': np.random.choice([0, 1], 300, p=[0.72, 0.28])
|
| 88 |
})
|
| 89 |
|
| 90 |
+
if 'date' in df.columns: df['date'] = pd.to_datetime(df['date'])
|
|
|
|
| 91 |
|
| 92 |
+
# Precise Geometric Centers
|
| 93 |
state_centers = {
|
| 94 |
+
'Andaman and Nicobar Islands': (11.7401, 92.6586), 'Andhra Pradesh': (15.9129, 79.7400),
|
| 95 |
+
'Arunachal Pradesh': (28.2180, 94.7278), 'Assam': (26.2006, 92.9376), 'Bihar': (25.0961, 85.3131),
|
| 96 |
+
'Chandigarh': (30.7333, 76.7794), 'Chhattisgarh': (21.2787, 81.8661), 'Delhi': (28.7041, 77.1025),
|
| 97 |
+
'Goa': (15.2993, 74.1240), 'Gujarat': (22.2587, 71.1924), 'Haryana': (29.0588, 76.0856),
|
| 98 |
+
'Himachal Pradesh': (31.9579, 77.1095), 'Jammu and Kashmir': (33.7782, 76.5762), 'Jharkhand': (23.6102, 85.2799),
|
| 99 |
+
'Karnataka': (15.3173, 75.7139), 'Kerala': (10.8505, 76.2711), 'Ladakh': (34.1526, 77.5770),
|
| 100 |
+
'Madhya Pradesh': (22.9734, 78.6569), 'Maharashtra': (19.7515, 75.7139), 'Manipur': (24.6637, 93.9063),
|
| 101 |
+
'Meghalaya': (25.4670, 91.3662), 'Mizoram': (23.1645, 92.9376), 'Nagaland': (26.1584, 94.5624),
|
| 102 |
+
'Odisha': (20.9517, 85.0985), 'Puducherry': (11.9416, 79.8083), 'Punjab': (31.1471, 75.3412),
|
| 103 |
+
'Rajasthan': (27.0238, 74.2179), 'Sikkim': (27.5330, 88.5122), 'Tamil Nadu': (11.1271, 78.6569),
|
| 104 |
+
'Telangana': (18.1124, 79.0193), 'Tripura': (23.9408, 91.9882), 'Uttar Pradesh': (26.8467, 80.9462),
|
| 105 |
+
'Uttarakhand': (30.0668, 79.0193), 'West Bengal': (22.9868, 87.8550)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 106 |
}
|
| 107 |
|
| 108 |
+
# EXPANDED Aspect Ratio Definitions (Lat spread, Lon spread)
|
|
|
|
|
|
|
| 109 |
state_spreads = {
|
| 110 |
+
'Kerala': (1.2, 0.25), 'West Bengal': (1.4, 0.4), 'Assam': (0.4, 1.8),
|
| 111 |
+
'Maharashtra': (1.8, 2.2), 'Uttar Pradesh': (1.2, 2.5), 'Bihar': (0.8, 1.5),
|
| 112 |
+
'Delhi': (0.1, 0.12), 'Goa': (0.15, 0.15), 'Chandigarh': (0.04, 0.04),
|
| 113 |
+
'Gujarat': (1.5, 1.8), 'Rajasthan': (2.0, 2.0), 'Madhya Pradesh': (1.8, 2.5),
|
| 114 |
+
'Himachal Pradesh': (0.6, 0.8), 'Punjab': (0.8, 0.9), 'Haryana': (0.9, 0.8),
|
| 115 |
+
'Tamil Nadu': (1.2, 1.0), 'Karnataka': (1.5, 1.2), 'Telangana': (1.0, 1.0),
|
| 116 |
+
'Andhra Pradesh': (1.5, 1.5), 'Odisha': (1.2, 1.2), 'Chhattisgarh': (1.5, 0.9),
|
| 117 |
+
'Jharkhand': (0.8, 1.0), 'Jammu and Kashmir': (1.0, 1.5), 'Ladakh': (1.0, 1.5),
|
| 118 |
+
'Uttarakhand': (0.7, 0.8)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 119 |
}
|
| 120 |
|
|
|
|
|
|
|
| 121 |
def get_coords(row):
|
| 122 |
state = row.get('state', 'Delhi')
|
| 123 |
+
district = str(row.get('district', 'Unknown')).lower()
|
|
|
|
| 124 |
base_lat, base_lon = state_centers.get(state, (20.5937, 78.9629))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 125 |
|
| 126 |
+
# Safer Default if state not found
|
| 127 |
+
lat_scale, lon_scale = state_spreads.get(state, (0.7, 0.7))
|
|
|
|
| 128 |
|
| 129 |
+
lat_bias, lon_bias = 0, 0
|
| 130 |
+
bias = 0.6
|
| 131 |
|
| 132 |
+
if 'north' in district: lat_bias += lat_scale * bias
|
| 133 |
+
if 'south' in district: lat_bias -= lat_scale * bias
|
| 134 |
+
if 'east' in district: lon_bias += lon_scale * bias
|
| 135 |
+
if 'west' in district: lon_bias -= lon_scale * bias
|
| 136 |
|
| 137 |
+
np.random.seed(hash(state + district) % 2**32)
|
| 138 |
+
rf = 0.5 if (lat_bias or lon_bias) else 1.0
|
|
|
|
| 139 |
|
| 140 |
return pd.Series({
|
| 141 |
+
'lat': base_lat + lat_bias + np.random.uniform(-lat_scale*rf, lat_scale*rf) + np.random.normal(0, 0.04),
|
| 142 |
+
'lon': base_lon + lon_bias + np.random.uniform(-lon_scale*rf, lon_scale*rf) + np.random.normal(0, 0.04)
|
| 143 |
})
|
| 144 |
|
| 145 |
coords = df.apply(get_coords, axis=1)
|
| 146 |
+
df['lat'], df['lon'] = coords['lat'], coords['lon']
|
| 147 |
+
df['risk_category'] = pd.cut(df['RISK_SCORE'], bins=[-1, 50, 75, 85, 100], labels=['Low', 'Medium', 'High', 'Critical'])
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 148 |
return df
|
| 149 |
|
| 150 |
+
with st.spinner('Loading S.T.A.R.K AI System...'): df = load_data()
|
| 151 |
|
| 152 |
# 4. SIDEBAR & FILTERS
|
| 153 |
with st.sidebar:
|
| 154 |
+
st.markdown("### π‘οΈ S.T.A.R.K AI Control")
|
| 155 |
st.markdown("---")
|
| 156 |
+
if 'date' in df.columns:
|
| 157 |
+
min_d, max_d = df['date'].min().date(), df['date'].max().date()
|
| 158 |
+
dr = st.date_input("Date Range", value=(min_d, max_d), min_value=min_d, max_value=max_d)
|
| 159 |
+
if len(dr) == 2: df = df[(df['date'].dt.date >= dr[0]) & (df['date'].dt.date <= dr[1])]
|
| 160 |
|
| 161 |
state_list = ['All'] + sorted(df['state'].unique().tolist())
|
| 162 |
+
sel_state = st.selectbox("State", state_list)
|
| 163 |
+
filtered_df = df[df['state'] == sel_state] if sel_state != 'All' else df.copy()
|
| 164 |
|
| 165 |
+
dist_list = ['All'] + sorted(filtered_df['district'].unique().tolist())
|
| 166 |
+
sel_dist = st.selectbox("District", dist_list)
|
| 167 |
+
if sel_dist != 'All': filtered_df = filtered_df[filtered_df['district'] == sel_dist]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 168 |
|
|
|
|
|
|
|
|
|
|
| 169 |
st.markdown("---")
|
| 170 |
+
risk_filter = st.multiselect("Risk Level", ['Low', 'Medium', 'High', 'Critical'], default=['High', 'Critical'])
|
| 171 |
+
if risk_filter: filtered_df = filtered_df[filtered_df['risk_category'].isin(risk_filter)]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 172 |
|
| 173 |
st.markdown("---")
|
| 174 |
+
st.link_button("π Open Analysis Notebook", "https://colab.research.google.com/drive/1YAQ4nfxltvG_cts3fmGc_zi2JQc4oPOT?usp=sharing", use_container_width=True)
|
| 175 |
+
st.info(f"**User:** UIDAI_Officer\n\n**Team:** UIDAI_4571\n\n**Update:** {datetime.now().strftime('%H:%M:%S')}")
|
|
|
|
| 176 |
|
| 177 |
+
# 5. HEADER & METRICS
|
| 178 |
col1, col2 = st.columns([3, 1])
|
| 179 |
with col1:
|
| 180 |
+
st.title("π‘οΈ S.T.A.R.K AI Dashboard")
|
| 181 |
+
st.markdown("**Context-Aware Fraud Detection & Prevention System**")
|
| 182 |
with col2:
|
| 183 |
+
st.markdown(f"""<div style="text-align: right; padding-top: 20px;"><span class="status-badge bg-green">β System Online</span><div style="font-size: 12px; color: #64748b; margin-top: 8px;">{datetime.now().strftime('%d %b %Y')}</div></div>""", unsafe_allow_html=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 184 |
|
| 185 |
st.markdown("---")
|
| 186 |
+
m1, m2, m3, m4, m5 = st.columns(5)
|
| 187 |
+
total, high, crit = len(filtered_df), len(filtered_df[filtered_df['RISK_SCORE'] > 75]), len(filtered_df[filtered_df['RISK_SCORE'] > 85])
|
| 188 |
+
m1.metric("Total Centers", f"{total:,}", border=True)
|
| 189 |
+
m2.metric("High Risk", f"{high}", delta="Review", delta_color="inverse", border=True)
|
| 190 |
+
m3.metric("Critical", f"{crit}", delta="Urgent", delta_color="inverse", border=True)
|
| 191 |
+
m4.metric("Avg Risk", f"{filtered_df['RISK_SCORE'].mean():.1f}/100" if not filtered_df.empty else "0", border=True)
|
| 192 |
+
m5.metric("Weekend Spikes", f"{len(filtered_df[(filtered_df['is_weekend'] == 1) & (filtered_df['RISK_SCORE'] > 70)])}", delta="Suspicious", delta_color="off", border=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 193 |
st.markdown("##")
|
| 194 |
|
| 195 |
# 6. TABS
|
| 196 |
+
tab_map, tab_list, tab_charts, tab_insights = st.tabs(["πΊοΈ Geographic Risk", "π Priority List", "π Patterns", "π AI Insights"])
|
| 197 |
|
| 198 |
with tab_map:
|
| 199 |
+
c_map, c_det = st.columns([3, 1])
|
| 200 |
+
with c_map:
|
| 201 |
if not filtered_df.empty:
|
| 202 |
+
fig = px.scatter_mapbox(filtered_df, lat="lat", lon="lon", color="RISK_SCORE", size="total_activity",
|
| 203 |
+
color_continuous_scale=["#22c55e", "#fbbf24", "#f97316", "#ef4444"], size_max=25, zoom=4.8 if sel_state != 'All' else 3.8,
|
| 204 |
+
center={"lat": 22.0, "lon": 80.0}, hover_name="district", mapbox_style="carto-positron", height=650, title="<b>Live Fraud Risk Heatmap</b>")
|
| 205 |
+
fig.update_layout(margin={"r":0,"t":40,"l":0,"b":0})
|
| 206 |
+
st.plotly_chart(fig, use_container_width=True)
|
| 207 |
+
else: st.warning("No data found.")
|
| 208 |
+
|
| 209 |
+
with c_det:
|
| 210 |
+
st.subheader("π₯ Top Hotspots")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 211 |
if not filtered_df.empty:
|
| 212 |
+
top = filtered_df.groupby('district').agg({'RISK_SCORE': 'mean', 'total_activity': 'sum'}).sort_values('RISK_SCORE', ascending=False).head(5)
|
| 213 |
+
for i, (d, r) in enumerate(top.iterrows(), 1):
|
| 214 |
+
clr, bdg = ("#ef4444", "CRITICAL") if r['RISK_SCORE'] > 85 else ("#f97316", "HIGH")
|
| 215 |
+
st.markdown(f"""<div class="hotspot-card" style="border-left-color: {clr};"><b>#{i} {d}</b><br><span style="font-size:12px;color:#64748b">Risk: <b style="color:{clr}">{r['RISK_SCORE']:.1f}</b> | Act: {int(r['total_activity'])}</span></div>""", unsafe_allow_html=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 216 |
|
| 217 |
with tab_list:
|
| 218 |
+
st.subheader("π― Priority Investigation")
|
| 219 |
+
targets = filtered_df[filtered_df['RISK_SCORE'] > 75].sort_values('RISK_SCORE', ascending=False)
|
| 220 |
+
csv = targets.to_csv(index=False).encode('utf-8')
|
| 221 |
+
st.download_button("π₯ Export CSV", data=csv, file_name="stark_priority.csv", mime="text/csv", type="primary")
|
| 222 |
+
st.dataframe(targets[['date', 'state', 'district', 'pincode', 'enrol_adult', 'total_activity', 'RISK_SCORE']],
|
| 223 |
+
column_config={"RISK_SCORE": st.column_config.ProgressColumn("Risk", format="%.1f%%", min_value=0, max_value=100)}, use_container_width=True, hide_index=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 224 |
|
| 225 |
with tab_charts:
|
| 226 |
c1, c2 = st.columns(2)
|
| 227 |
with c1:
|
| 228 |
+
st.markdown("**Ghost ID Detection**")
|
| 229 |
+
fig = px.scatter(filtered_df, x="total_activity", y="ratio_deviation", color="risk_category", size="RISK_SCORE",
|
| 230 |
+
color_discrete_map={'Critical': '#ef4444', 'High': '#f97316', 'Medium': '#eab308', 'Low': '#22c55e'}, height=350)
|
| 231 |
+
fig.add_hline(y=0.2, line_dash="dash", line_color="red")
|
| 232 |
+
st.plotly_chart(fig, use_container_width=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 233 |
with c2:
|
| 234 |
+
st.markdown("**Weekend Activity Analysis**")
|
| 235 |
+
wk_counts = filtered_df.groupby('is_weekend')['total_activity'].sum().reset_index()
|
| 236 |
+
wk_counts['Type'] = wk_counts['is_weekend'].map({0: 'Weekday', 1: 'Weekend'})
|
| 237 |
+
fig = px.bar(wk_counts, x='Type', y='total_activity', color='Type', color_discrete_map={'Weekday': '#3b82f6', 'Weekend': '#ef4444'}, height=350)
|
| 238 |
+
st.plotly_chart(fig, use_container_width=True)
|
| 239 |
+
|
| 240 |
+
with tab_insights:
|
| 241 |
+
st.subheader("π AI Detective Insights")
|
| 242 |
+
if not filtered_df.empty:
|
| 243 |
+
anom = filtered_df[filtered_df['ratio_deviation'] > 0.4]
|
| 244 |
+
st.info(f"π€ **AI Analysis:** Detected {len(anom)} centers with statistically significant enrollment deviations (> 2Ο from mean).")
|
| 245 |
+
|
| 246 |
+
c_i1, c_i2 = st.columns(2)
|
| 247 |
+
with c_i1:
|
| 248 |
+
st.markdown("#### π¨ Primary Risk Factors")
|
| 249 |
+
st.markdown("- **High Volume on Weekends:** 28% correlation with fraud")
|
| 250 |
+
st.markdown("- **Adult Enrollment Spikes:** 45% correlation with ghost IDs")
|
| 251 |
+
with c_i2:
|
| 252 |
+
st.markdown("#### π‘ Recommended Actions")
|
| 253 |
+
st.markdown(f"1. Immediate audit of {len(filtered_df[filtered_df['RISK_SCORE']>90])} centers with >90 Risk Score")
|
| 254 |
+
st.markdown("2. Deploy biometric re-verification for 'Rural A' cluster")
|
| 255 |
|
| 256 |
st.markdown("---")
|
| 257 |
st.markdown("""<div style="text-align: center; font-size: 13px; color: #94a3b8;"><b>Project S.T.A.R.K AI</b> | UIDAI Hackathon 2026</div>""", unsafe_allow_html=True)
|