import pandas as pd import plotly.express as px import pydeck as pdk import streamlit as st from streamlit_plotly_events import plotly_events # Group 5 Final Project - Part 2 Dashboard # Group Members: Nabeel Bashir, Tony An, Devansh Kumar, Jiajun Li # Streamlit application setup st.title('Group 5 Final Project - Part 2 (Dashboard)') st.text("Group Members: Nabeel Bashir, Tony An, Devansh Kumar, Jiajun Li") # Project URL st.text("The URL for this app is: https://huggingface.co/spaces/fa24-is445-group5/Final_Project_Part2") # Load the electric vehicle dataset ev_data = pd.read_csv('data/Electric_Vehicle_Population_Data.csv') # Dashboard introduction st.title('Electric Vehicle Population Data Dashboard') st.markdown('''Explore the electric vehicle data interactively using this dashboard. This dashboard helps experts and stakeholders understand the distribution and characteristics of electric vehicles in various counties and cities.''') # Dashboard usage explanation st.markdown('''### How to Use This Dashboard To explore the dataset, use the global filter options in the sidebar to filter by county and make. These filters will update all the visualizations, providing a focused view of the data. Alternatively, you can select a specific vehicle make directly in the "Vehicle Count by Make" chart. This selection will link to and update the rest of the visualizations to display data relevant to the selected make. All charts are interactive. You can click on bars to highlight corresponding data points in other charts, making it easier to discover patterns and relationships. The map is also interactive; you can zoom in, rotate, and click on points to see additional information about each vehicle.''') # Extract latitude and longitude from 'Vehicle Location' column ev_data[['Longitude', 'Latitude']] = ev_data['Vehicle Location'].str.extract(r'POINT \((-?\d+\.\d+) (-?\d+\.\d+)\)') ev_data['Latitude'] = pd.to_numeric(ev_data['Latitude'], errors='coerce') ev_data['Longitude'] = pd.to_numeric(ev_data['Longitude'], errors='coerce') # Sidebar filter options county_list = ev_data['County'].unique() make_list = ev_data['Make'].unique() selected_county = st.sidebar.selectbox('Select County', county_list) selected_make = st.sidebar.multiselect('Select Make', make_list, default=make_list) # Filter data based on sidebar selections filtered_data = ev_data[(ev_data['County'] == selected_county) & (ev_data['Make'].isin(selected_make))] # Display filtered data st.subheader('Filtered Data') st.write(filtered_data) # Interactive Bar Chart - Vehicle Count by Make st.subheader('Vehicle Count by Make') make_counts = filtered_data['Make'].value_counts().reset_index() make_counts.columns = ['Make', 'Count'] def create_bar_chart(selected_make=None): # If a make is selected, highlight it in blue, otherwise default to green if selected_make: make_counts['Color'] = make_counts['Make'].apply( lambda x: 'blue' if x == selected_make else 'green' ) color_map = make_counts.set_index('Make')['Color'] else: color_map = 'green' # Create a bar chart showing vehicle count by make chart = px.bar( make_counts, x='Make', y='Count', title="Vehicle Count by Make", labels={'Make': 'Vehicle Make', 'Count': 'Number of Vehicles'}, color='Make', color_discrete_map=color_map if isinstance(color_map, dict) else None ) chart.update_layout(clickmode='event+select') # Enable click interactions return chart # Display the bar chart and capture click data bar_chart = create_bar_chart(st.session_state.get('selected_make', None)) clicked_points = plotly_events(bar_chart, click_event=True, hover_event=False, select_event=False) # Update the selected make based on user interaction if clicked_points: st.session_state['selected_make'] = clicked_points[0]['x'] # Get clicked make else: st.session_state['selected_make'] = None # Display selected make selected_make = st.session_state['selected_make'] if selected_make: st.write(f"Selected Make: {selected_make}") # Filter data for the line chart based on selected make if selected_make: filtered_data = ev_data[ev_data['Make'] == selected_make] else: filtered_data = ev_data # Group data by model year for the filtered data model_year_data = filtered_data.groupby('Model Year').size().reset_index(name='Count') # Create the line chart for model count by year st.subheader(f"Number of Vehicles by Model Year for {selected_make if selected_make else 'All Makes'}") line_chart = px.line( model_year_data, x='Model Year', y='Count', title=f"Number of Vehicles by Model Year for {selected_make if selected_make else 'All Makes'}", labels={'Model Year': 'Year', 'Count': 'Number of Vehicles'}, markers=True ) # Display the line chart st.plotly_chart(line_chart, use_container_width=True) # Interactive Map of Vehicle Locations st.subheader('Map of Vehicle Locations') filtered_data = filtered_data.dropna(subset=['Latitude', 'Longitude']) filtered_data.rename(columns={'Latitude': 'latitude', 'Longitude': 'longitude'}, inplace=True) # Create an interactive map using PyDeck st.pydeck_chart(pdk.Deck( initial_view_state=pdk.ViewState( latitude=filtered_data['latitude'].mean(), longitude=filtered_data['longitude'].mean(), zoom=10, ), layers=[ pdk.Layer( 'ScatterplotLayer', data=filtered_data, get_position='[longitude, latitude]', get_radius=200, get_color='[200, 30, 0, 160]', pickable=True ) ], tooltip={ "html": "Make: {Make}
Model: {Model}
Electric Range: {Electric Range}", "style": { "backgroundColor": "steelblue", "color": "white" } } )) # Contextual datasets st.markdown('''### Contextual Datasets A potentially useful contextual dataset could be the [Electric Charging Stations Locations](https://afdc.energy.gov/fuels/electricity_locations.html). This dataset will provide information about the availability of charging stations in each county, allowing for a deeper analysis of the convenience and accessibility of electric vehicles in different regions.''') # Dataset size comment st.markdown('''### Dataset Size This dataset is uploaded huggingface repo using Git LFS, so there is no need to revise the plan for hosting this data.''')