Spaces:

MyEnny
/

Energy_grid_forcast

Sleeping

App Files Files Community

Energy_grid_forcast / app.py

MyEnny

changed model to pickle

05ac191 verified 5 months ago

raw

history blame contribute delete

13.1 kB

	import streamlit as st
	import pandas as pd
	import numpy as np
	import plotly.express as px
	import plotly.graph_objects as go
	from datetime import datetime, timedelta
	from joblib import load
	import requests
	import pytz
	import time


	# Constants
	# Base URL of the Supabase project; load_data() appends the REST path to it.
	SUPABASE_URL = "https://ubbyirdtynaerjodadal.supabase.co"
	# NOTE(review): this key is committed in source. Its JWT payload reads
	# "role":"anon", so it appears to be the public anonymous key rather than a
	# service key -- confirm, and confirm row-level security protects the table.
	SUPABASE_API_KEY = "eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJpc3MiOiJzdXBhYmFzZSIsInJlZiI6InViYnlpcmR0eW5hZXJqb2RhZGFsIiwicm9sZSI6ImFub24iLCJpYXQiOjE3NTI0OTIyNjcsImV4cCI6MjA2ODA2ODI2N30.iTHJ18BZED_gE5VyZrBp7YWiy6NNzsA1YdqeazFtxZI"
	# Name of the table queried through the REST endpoint.
	TABLE = "smart_meter_readings_1year"
	# Time zone used for "now" calculations and the footer timestamp.
	TIMEZONE = pytz.timezone("Europe/London")
	# Timezone-aware wall-clock time, captured once when this statement runs.
	now = pd.Timestamp.now(TIMEZONE)

	def auto_refresh(interval_seconds=60):
		"""Block for ``interval_seconds`` and then request a Streamlit rerun.

		Args:
			interval_seconds: Number of seconds to sleep before the rerun.
		"""
		delay = interval_seconds
		# The sleep blocks the script; the rerun is only requested afterwards.
		time.sleep(delay)
		st.rerun()

	# Page title and wide layout. This is the first `st.` call the script
	# executes. NOTE(review): Streamlit documents that set_page_config must
	# precede other Streamlit commands -- keep it above any new `st.` usage.
	st.set_page_config(page_title="Electric Grid Dashboard", layout="wide")

	@st.cache_data(ttl=120)
	def load_data():
		"""Fetch meter readings from Supabase and derive the model features.

		Rows whose ``timestamp`` is earlier than the current UTC instant are
		requested from ``TABLE``. The result is indexed by a UTC ``datetime``
		index, sorted by time, and extended with:

		* ``week`` and one-hot ``day_of_week_*`` calendar columns,
		* ``hour_sin`` / ``hour_cos`` cyclic encodings of the UTC hour,
		* ``lag_30mins`` / ``lag_1hr`` (previous one and two rows),
		* ``roll_mean_1hr`` / ``roll_mean_2hr`` (means of the previous two and
		  four rows),
		* one-hot ``region_*`` and ``property_type_*`` columns.

		Returns:
			pandas.DataFrame: the feature frame described above.

		On a request failure, a non-200 response or an empty payload, an error
		is shown with ``st.error`` and the script is halted with ``st.stop``.
		"""
		# Use an explicit UTC instant: the readings are parsed as UTC below,
		# and a naive local time would shift the cutoff on non-UTC hosts.
		cutoff = datetime.now(pytz.utc).isoformat()
		headers = {
			"apikey": SUPABASE_API_KEY,
			"Authorization": f"Bearer {SUPABASE_API_KEY}",
		}
		try:
			# Passing the filter through `params` percent-encodes the "+" of
			# the UTC offset; a timeout keeps the dashboard from hanging.
			res = requests.get(
				f"{SUPABASE_URL}/rest/v1/{TABLE}",
				headers=headers,
				params={"timestamp": f"lt.{cutoff}"},
				timeout=30,
			)
		except requests.RequestException as exc:
			st.error(f"Failed to fetch data: {exc}")
			st.stop()
		if res.status_code != 200:
			st.error(f"Failed to fetch data: {res.status_code}")
			st.stop()

		df = pd.DataFrame(res.json())
		if df.empty:
			# Without this guard the column lookups below raise KeyError.
			st.error("Failed to fetch data: no rows returned")
			st.stop()

		df['datetime'] = pd.to_datetime(df['timestamp'], utc=True)
		df = df.set_index('datetime').sort_index()

		# Calendar features, all derived from the UTC index.
		hour_of_day = df.index.hour.to_numpy()
		df['week'] = df.index.isocalendar().week
		df['day_of_week'] = df.index.day_name()
		df['hour_sin'] = np.sin(2 * np.pi * hour_of_day / 24)
		df['hour_cos'] = np.cos(2 * np.pi * hour_of_day / 24)

		# Lag / rolling features use only earlier rows (shift(1)) so a row never
		# sees its own target.
		# NOTE(review): the shifts run over the whole time-sorted frame, not per
		# region/property; presumably this mirrors how the model was trained --
		# confirm before changing.
		consumption = df['power_consumption_kwh']
		previous = consumption.shift(1)
		df['lag_30mins'] = previous
		df['lag_1hr'] = consumption.shift(2)
		df['roll_mean_1hr'] = previous.rolling(2).mean()
		df['roll_mean_2hr'] = previous.rolling(4).mean()
		lag_cols = ['lag_30mins', 'lag_1hr', 'roll_mean_1hr', 'roll_mean_2hr']
		# Leading rows have no history; forward-fill, then fall back to 0.
		df[lag_cols] = df[lag_cols].ffill().fillna(0)

		df = pd.get_dummies(df, columns=['region', 'property_type', 'day_of_week'], drop_first=False)
		# Store the one-hot columns as integers rather than booleans.
		df = df.astype({col: 'int' for col in df.select_dtypes('bool').columns})
		return df

	def _forecast_ahead(model, data, steps=4, step_minutes=30):
		"""Recursively forecast ``steps`` intervals past the last row of ``data``.

		Each step copies the last observed row, refreshes its time-dependent
		features and feeds the previous predictions back in as lag values.

		Args:
			model: Fitted estimator exposing ``predict`` and ``feature_names_in_``.
			data: Non-empty feature frame as returned by ``load_data``.
			steps: Number of future intervals to predict.
			step_minutes: Length of one interval in minutes.

		Returns:
			tuple: ``(timestamps, forecasts)``, two lists of length ``steps``.
		"""
		template = data.iloc[-1:].copy()
		last_time = template.index[0]

		# Most recent consumption values, oldest first. Predictions are appended
		# as they are made, so the lag/rolling features below follow the same
		# definitions as load_data (previous 1, 2 and 4 values).
		history = [float(v) for v in data['power_consumption_kwh'].iloc[-4:]]
		# Pad short histories with 0, the fallback load_data uses for missing lags.
		history = [0.0] * (4 - len(history)) + history

		day_cols = [col for col in data.columns if col.startswith('day_of_week_')]
		timestamps = []
		forecasts = []
		for step in range(1, steps + 1):
			future_time = last_time + timedelta(minutes=step_minutes * step)
			row = template.copy()
			row.index = [future_time]

			# Time-of-day and calendar features follow the forecast timestamp,
			# which may cross into the next day or ISO week.
			row['hour_sin'] = np.sin(2 * np.pi * future_time.hour / 24)
			row['hour_cos'] = np.cos(2 * np.pi * future_time.hour / 24)
			if 'week' in row.columns:
				row['week'] = future_time.isocalendar()[1]
			active_day = f"day_of_week_{future_time.day_name()}"
			for col in day_cols:
				row[col] = int(col == active_day)

			row['lag_30mins'] = history[-1]
			row['lag_1hr'] = history[-2]
			row['roll_mean_1hr'] = np.mean(history[-2:])
			row['roll_mean_2hr'] = np.mean(history[-4:])

			prediction = model.predict(row[model.feature_names_in_])[0]
			history.append(float(prediction))
			timestamps.append(future_time)
			forecasts.append(prediction)
		return timestamps, forecasts


	def _consumption_by_region(data):
		"""Return total and mean consumption for each one-hot ``region_*`` column."""
		rows = []
		for col in data.filter(like='region_').columns:
			usage = data.loc[data[col] == 1, 'power_consumption_kwh']
			rows.append({
				'Region': col.replace('region_', ''),
				'Total Consumption': usage.sum(),
				'Avg Consumption': usage.mean(),
			})
		return pd.DataFrame(rows, columns=['Region', 'Total Consumption', 'Avg Consumption'])


	def main():
		"""Render the dashboard: filters, current status, forecast, model error
		metrics and the trend tabs.

		Reads the feature frame from ``load_data`` and the fitted model from
		``rf_model.pkl``; everything else is written to the Streamlit page.
		"""
		# Load data and model
		data = load_data()
		# NOTE: joblib.load unpickles the file; only ship a trusted rf_model.pkl.
		model = load('rf_model.pkl')

		# Title and description
		st.title("🌡️ Real-Time Energy Dashboard")
		st.markdown("Monitoring power consumption, environmental factors, and forecast accuracy across regions")

		if data.empty:
			# Every section below indexes the last row, so stop early.
			st.warning("No meter readings are available yet.")
			return

		# In-sample forecast for every historical row
		features = data.drop(columns=['power_consumption_kwh', 'timestamp'], errors='ignore')
		data['forecast'] = model.predict(features[model.feature_names_in_])

		# Sidebar filters
		st.sidebar.header("Filter Options")
		# Build readable region and property_type filters from the one-hot columns
		region_columns = list(data.filter(like='region_').columns)
		region_labels = ['All'] + [col.replace('region_', '') for col in region_columns]
		region = st.sidebar.selectbox("Region", region_labels)

		property_columns = list(data.filter(like='property_type_').columns)
		property_labels = ['All'] + [col.replace('property_type_', '') for col in property_columns]
		property_selection = st.sidebar.selectbox("Property Type", property_labels)

		time_range = st.sidebar.select_slider("Time Range",
			options=['1h', '6h', '12h', '1D', '1W'],
			value='12h')
		filtered_data = data.copy()

		# Apply region filter
		if region != 'All':
			region_col = f"region_{region}"
			if region_col in filtered_data.columns:
				filtered_data = filtered_data[filtered_data[region_col] == 1]

		# Apply property_type filter
		if property_selection != 'All':
			property_col = f"property_type_{property_selection}"
			if property_col in filtered_data.columns:
				filtered_data = filtered_data[filtered_data[property_col] == 1]

		# Apply time filter against a timestamp taken for this run
		window_start = pd.Timestamp.now(TIMEZONE) - pd.Timedelta(time_range)
		filtered_data = filtered_data.loc[filtered_data.index > window_start]
		has_rows = not filtered_data.empty

		# Current metrics
		st.subheader("📊 Current Energy Status")
		if has_rows:
			current = filtered_data.iloc[-1]
			actual = current['power_consumption_kwh']
			# Percentage error of the row being displayed; undefined when the
			# reading is zero, in which case no delta is shown.
			if actual != 0:
				current_error = (actual - current['forecast']) / actual * 100
				error_delta = f"{current_error:.1f}% error"
			else:
				error_delta = None
			col1, col2, col3, col4 = st.columns(4)
			col1.metric("Power Consumption", f"{actual:.2f} kWh",
				delta=error_delta, delta_color="inverse")
			col2.metric("Voltage", f"{current['voltage']:.1f} V")
			col3.metric("Temperature", f"{current['temperature_c']:.1f}°C")
			col4.metric("Humidity", f"{current['humidity_pct']:.1f}%")
		else:
			st.warning("No readings match the selected filters and time range.")

		# --- 2-Hour Forecast ---
		st.subheader("🔮 Next 2 Hours Forecast")

		# 4 steps = next 2 hours (30-min intervals)
		timestamps, forecast_steps = _forecast_ahead(model, data, steps=4, step_minutes=30)

		# Format forecast results
		forecast_df = pd.DataFrame({
			"datetime": timestamps,
			"forecast_kwh": forecast_steps
		}).set_index("datetime")

		# --- Display 30 min / 1 hr / 2 hr Forecast ---
		col1, col2, col3 = st.columns(3)
		col1.metric("In 30 mins", f"{forecast_steps[0]:.2f} kWh", timestamps[0].strftime('%H:%M'))
		col2.metric("In 1 hour", f"{forecast_steps[1]:.2f} kWh", timestamps[1].strftime('%H:%M'))
		col3.metric("In 2 hours", f"{forecast_steps[3]:.2f} kWh", timestamps[3].strftime('%H:%M'))

		# Plot forecast
		fig_forecast = go.Figure()
		fig_forecast.add_trace(go.Scatter(x=forecast_df.index, y=forecast_df['forecast_kwh'],
			mode='lines+markers', name="Forecast"))
		fig_forecast.update_layout(title="2-Hour Ahead Forecast", xaxis_title="Time", yaxis_title="kWh")
		st.plotly_chart(fig_forecast, use_container_width=True)

		# --- Model Performance: Current and 12-Hour Highs/Lows ---
		st.subheader("📏 Model Performance (Last 12 Hours, 30-Min Intervals)")

		# Step 1: Prepare error columns
		perf_df = data[['power_consumption_kwh', 'forecast']].copy()
		perf_df['error'] = perf_df['power_consumption_kwh'] - perf_df['forecast']
		perf_df['abs_error'] = perf_df['error'].abs()
		perf_df['squared_error'] = perf_df['error']**2

		# Step 2: Resample into 30-min intervals
		interval_perf = perf_df.resample('30min').agg({
			'squared_error': 'mean',
			'abs_error': 'mean'
		}).dropna()

		# Limit to the 12 hours ending at the newest interval in the data
		end_time = interval_perf.index.max()
		start_time = end_time - timedelta(hours=12)
		last_12h_perf = interval_perf.loc[start_time:end_time].copy()
		# RMSE is the square root of the per-interval mean squared error
		last_12h_perf['RMSE'] = np.sqrt(last_12h_perf['squared_error'])
		last_12h_perf['MAE'] = last_12h_perf['abs_error']
		last_12h_perf = last_12h_perf[['RMSE', 'MAE']]

		# Step 3: Current metrics
		time_format = '%Y-%m-%d %H:%M'
		current_rmse = last_12h_perf['RMSE'].iloc[-1]
		current_mae = last_12h_perf['MAE'].iloc[-1]
		current_time = last_12h_perf.index[-1].strftime(time_format)

		# Step 4: Highs and lows
		lowest_rmse = last_12h_perf['RMSE'].min()
		lowest_rmse_time = last_12h_perf['RMSE'].idxmin().strftime(time_format)

		highest_rmse = last_12h_perf['RMSE'].max()
		highest_rmse_time = last_12h_perf['RMSE'].idxmax().strftime(time_format)

		lowest_mae = last_12h_perf['MAE'].min()
		lowest_mae_time = last_12h_perf['MAE'].idxmin().strftime(time_format)

		highest_mae = last_12h_perf['MAE'].max()
		highest_mae_time = last_12h_perf['MAE'].idxmax().strftime(time_format)

		# Step 5: Display
		col1, col2 = st.columns(2)
		col1.metric("Current RMSE", f"{current_rmse:.3f} kWh", current_time)
		col2.metric("Current MAE", f"{current_mae:.3f} kWh", current_time)

		col3, col4, col5, col6 = st.columns(4)
		col3.metric("🔽 Lowest RMSE (12h)", f"{lowest_rmse:.3f} kWh", lowest_rmse_time)
		col4.metric("🔼 Highest RMSE (12h)", f"{highest_rmse:.3f} kWh", highest_rmse_time)
		col5.metric("🔽 Lowest MAE (12h)", f"{lowest_mae:.3f} kWh", lowest_mae_time)
		col6.metric("🔼 Highest MAE (12h)", f"{highest_mae:.3f} kWh", highest_mae_time)

		st.subheader("📈 RMSE and MAE over the Last 12 Hours")
		fig_errors = px.line(
			last_12h_perf,
			x=last_12h_perf.index,
			y=['RMSE', 'MAE'],
			labels={'value': 'Error (kWh)', 'variable': 'Metric', 'datetime': 'Time'},
			title="Model Error Metrics (30-Min Intervals)"
		)
		fig_errors.update_layout(
			xaxis_title="Time",
			yaxis_title="kWh",
			template="plotly_white",
			legend_title="Metric",
			height=350
		)
		st.plotly_chart(fig_errors, use_container_width=True)

		# Main content tabs
		tab1, tab2, tab3 = st.tabs(["Consumption Trends", "Regional Analysis", "Environmental Factors"])

		with tab1:
			if has_rows:
				fig1 = px.line(filtered_data, x=filtered_data.index,
					y=['power_consumption_kwh', 'forecast'],
					title="Power Consumption vs Forecast")
				st.plotly_chart(fig1, use_container_width=True)

				# Hourly pattern
				numeric_cols = filtered_data.select_dtypes(include=[np.number]).columns
				hourly = filtered_data[numeric_cols].groupby(filtered_data.index.hour).mean()
				fig2 = px.bar(hourly, x=hourly.index, y='power_consumption_kwh',
					title="Average Hourly Consumption Pattern")
				st.plotly_chart(fig2, use_container_width=True)
			else:
				st.info("No readings match the selected filters and time range.")

		with tab2:
			# The raw `region` column is one-hot encoded by load_data, so the
			# per-region figures are rebuilt from the `region_*` indicators.
			region_stats = _consumption_by_region(data)
			if not region_stats.empty:
				fig3 = px.pie(region_stats, names='Region', values='Total Consumption',
					title="Regional Consumption Share")
				st.plotly_chart(fig3, use_container_width=True)

				# Regional comparison
				fig4 = px.bar(region_stats, x='Region', y='Avg Consumption',
					title="Average Consumption by Region")
				st.plotly_chart(fig4, use_container_width=True)

		with tab3:
			if has_rows:
				fig5 = px.line(filtered_data, x=filtered_data.index,
					y=['temperature_c', 'humidity_pct'],
					title="Temperature & Humidity Trends")
				st.plotly_chart(fig5, use_container_width=True)

				fig6 = px.scatter(filtered_data, x='temperature_c', y='power_consumption_kwh',
					color='voltage', size='humidity_pct',
					title="Consumption vs Temperature (Colored by Voltage)")
				st.plotly_chart(fig6, use_container_width=True)
			else:
				st.info("No readings match the selected filters and time range.")

		# Footer
		st.markdown("---")
		st.markdown('Developed by Opeyemi Abodunrin')
		st.markdown(f"Last updated: {datetime.now(TIMEZONE).strftime('%Y-%m-%d %H:%M:%S')}")
		st.markdown("© 2025 Electric Forecast (Demonstration Purpose)")

	# Script entry point: render the dashboard once, then sleep for 60 seconds
	# and request a rerun so the page refreshes itself.
	if __name__ == "__main__":
		main()
		auto_refresh(60)