import pandas as pd
import plotly.express as px
import plotly.graph_objects as go
from dash import Dash, dcc, html, Input, Output, State, ctx
import dash_daq as daq
import numpy as np
import dash_bootstrap_components as dbc
# 1. Data Loading & Preprocessing
df_global = pd.read_csv("merged_global.csv")
df_hemi = pd.read_csv("hemispheric_merged.csv")
# Merge by Year and Month
df = pd.merge(df_global, df_hemi, on=["year", "month"], suffixes=("", "_hemi"))
# For the seaosnal analysis categorizing the months
def get_season(month):
return {
12: "DJF", 1: "DJF", 2: "DJF",
3: "MAM", 4: "MAM", 5: "MAM",
6: "JJA", 7: "JJA", 8: "JJA",
9: "SON", 10: "SON", 11: "SON"
}[month]
df["Season"] = df["month"].apply(get_season)
# 2. App Initialization
app = Dash(__name__)
app.title = "Correlation & Insight Explorer"
# Define the variables for the dropdowns
def get_variables(scope):
if scope == "global":
return {
"co2_anomaly": "COβ Anomaly",
"land_ocean_anomaly": "Global Land+Ocean Temp Anomaly",
"land_anomaly": "Global Land Temp Anomaly",
"msl_mm": "Sea Level Change"
}
elif scope == "nh":
return {
"north_co2_anomaly": "NH COβ Anomaly",
"north_land_ocean_anomaly": "NH Land+Ocean Temp Anomaly",
"north_land_anomaly": "NH Land Temp Anomaly",
"msl_mm_north": "NH Sea Level Change"
}
elif scope == "sh":
return {
"south_co2_anomaly": "SH COβ Anomaly",
"south_land_ocean_anomaly": "SH Land+Ocean Temp Anomaly",
"south_land_anomaly": "SH Land Temp Anomaly",
"msl_mm_south": "SH Sea Level Change"
}
# 3. App Layout
app = Dash(__name__, external_stylesheets=[dbc.themes.FLATLY])
app.title = "Correlation & Insight Explorer"
app.layout = dbc.Container([
dbc.Row([
dbc.Col(html.H2("Correlation & Insight Explorer", className="text-center"), width=12)
], className="my-3"),
dbc.Row([
dbc.Col([
html.Label("Scope"),
dcc.RadioItems(id="scope-selector", options=[
{"label": "π Global", "value": "global"},
{"label": "π Northern Hemisphere", "value": "nh"},
{"label": "π Southern Hemisphere", "value": "sh"}
], value="global", labelStyle={"display": "block"})
], md=6),
dbc.Col([
html.Label("Theme"),
daq.ToggleSwitch(id='theme-toggle', label=['Light', 'Dark'], value=False)
], md=6)
], className="mb-3"),
dbc.Row([
dbc.Col([
html.Label("X-axis Variable"),
html.P("Select the variable for the X-axis"),
dcc.Dropdown(id='x-axis-dropdown', placeholder="Choose a variable for X-axis")
], md=6),
dbc.Col([
html.Label("Y-axis Variable"),
html.P("Select the variable for the Y-axis"),
dcc.Dropdown(id='y-axis-dropdown', placeholder="Choose a variable for Y-axis")
], md=6)
], className="mb-3"),
dbc.Row([
dbc.Col([
html.Label("Year Range"),
dcc.RangeSlider(
id='year-slider',
min=df['year'].min(), max=df['year'].max(),
value=[df['year'].min(), df['year'].max()],
marks={str(year): str(year) for year in range(df['year'].min(), df['year'].max()+1, 5)},
step=1
),
html.Label("View Mode", style={'marginTop': '10px'}),
dcc.RadioItems(
id='view-mode',
options=[
{"label": "Monthly", "value": "Monthly"},
{"label": "Seasonal", "value": "Seasonal"}
],
value="Monthly",
labelStyle={"display": "inline-block", "margin-right": "10px"}
)
], md=12)
], className="mb-4"),
dbc.Card([
dbc.CardHeader("π What Youβre Seeing β Climate Insights"),
dbc.CardBody([
html.P("This interactive tool allows you to explore the statistical relationships between climate indicators:"),
html.Ul([
html.Li("π± Human-induced COβ emissions heat the planet β‘οΈ"),
html.Li("π‘οΈ Rising COβ leads to higher land and ocean temperatures β‘οΈ"),
html.Li("π Warmer climates cause sea level rise through ice melt and ocean expansion.")
]),
html.P("Switch views (Global, Northern, Southern Hemisphere) and select indicators and years to compare."),
html.P("The scatter plot shows how the selected variables change together, with a regression trendline and RΒ² value."),
html.P("Pearson's r (shown in the heatmap and above the scatter) helps you evaluate correlation strength."),
html.P("The correlation heatmap reveals how all indicators relate within your selected range.")
])
], className="mb-4"),
html.Div(id='correlation-note', style={'padding': '10px', 'fontSize': '16px'}),
dcc.Graph(id='scatter-plot'),
html.H4("Correlation Matrix (Pearson)", className="text-center mt-4"),
dcc.Graph(id='correlation-heatmap')
], fluid=True)
# 4. Callbacks
@app.callback(
Output('x-axis-dropdown', 'options'),
Output('y-axis-dropdown', 'options'),
Output('x-axis-dropdown', 'value'),
Output('y-axis-dropdown', 'value'),
Input('scope-selector', 'value') )
def update_variable_options(scope):
vars = get_variables(scope)
options = [{'label': v, 'value': k} for k, v in vars.items()]
return options, options, list(vars.keys())[0], list(vars.keys())[1]
@app.callback(
Output('scatter-plot', 'figure'),
Output('correlation-heatmap', 'figure'),
Output('correlation-note', 'children'),
Input('x-axis-dropdown', 'value'),
Input('y-axis-dropdown', 'value'),
Input('year-slider', 'value'),
Input('view-mode', 'value'),
Input('scope-selector', 'value'),
Input('theme-toggle', 'value')
)
def update_visuals(x_var, y_var, year_range,view_mode, scope, dark_mode):
vars_dict = get_variables(scope)
dff = df[(df["year"] >= year_range[0]) & (df["year"] <= year_range[1])]
"""
Updating both charts based on user inputs
Supports theme switching and monthly/seasonal toggling.
"""
# If the view mode switched one the seasonal the month columns are not needed
if view_mode == "Seasonal":
dff = dff.groupby(['year', 'Season']).mean(numeric_only=True).reset_index()
else:
dff = dff.copy()
r = dff[[x_var, y_var]].corr().iloc[0, 1]
strength = "No correlation"
if abs(r) > 0.8:
strength = "π Very strong correlation"
elif abs(r) > 0.6:
strength = "π Strong correlation"
elif abs(r) > 0.4:
strength = "π Moderate correlation"
elif abs(r) > 0.2:
strength = "π Weak correlation"
elif abs(r) > 0:
strength = "π Very weak correlation"
corr_sentence = f"{strength} detected (r = {r:.2f})"
# Scatter Plot with Regression
fig = px.scatter(
dff, x=x_var, y=y_var, trendline="ols",
title=f"{vars_dict[x_var]} vs {vars_dict[y_var]}",
labels={x_var: vars_dict[x_var], y_var: vars_dict[y_var]},
template="plotly_dark" if dark_mode else "plotly_white"
)
fig.update_traces(
hovertemplate=f"Year: %{{customdata[0]}}
Month/Season: %{{customdata[1]}}
{vars_dict[x_var]}: %{{x:.3f}}
{vars_dict[y_var]}: %{{y:.3f}}",
customdata=dff[["year", "Season"]] if view_mode == "Seasonal" else dff[["year", "month"]]
)
# Add RΒ² if OLS exists
try:
results = px.get_trendline_results(fig)
r_squared = results.iloc[0]["px_fit_results"].rsquared
fig.add_annotation(
xref="paper", yref="paper",
x=0.95, y=0.05,
text=f"RΒ² = {r_squared:.2f}",
showarrow=False,
font=dict(size=14, color="white" if dark_mode else "black")
)
except:
pass
corr = dff[list(vars_dict.keys())].corr().round(2)
heatmap = go.Figure(data=go.Heatmap(
z=corr.values,
x=list(vars_dict.values()),
y=list(vars_dict.values()),
colorscale='Cividis',
zmin=-1, zmax=1,
colorbar=dict(title="Pearson r")
))
heatmap.update_layout(template="plotly_dark" if dark_mode else "plotly_white")
return fig, heatmap, corr_sentence
server = app.server # Required for gunicorn
# 5. Run app
if __name__ == '__main__':
app.run_server(debug=True, host='0.0.0.0', port=7860)
dbc.Row([
dbc.Col(html.Footer("Created by Irem R. as part of Bachelor Thesis at Riga Technical University β 2025", className="text-center text-muted"), width=12)
], className="mt-4")