Spaces:

ralate2
/

Group3FinalProjectPart3

Sleeping

App Files Files Community

ralate2 committed on Dec 10, 2024

Commit

d6169d6

verified ·

1 Parent(s): 018460a

Update app.py

Browse files

Files changed (1) hide show

app.py +67 -166

app.py CHANGED Viewed

@@ -435,86 +435,86 @@ elif viz_type == "Complaints by Housing Block and Type":
     The 'inferno' color palette is used to represent different complaint types, with darker shades indicating a higher frequency of complaints. The stacked bar chart makes it easy to compare the distribution of complaints by block and type.
 """)
-# elif viz_type == "Complaints by Housing Block and Type (Incorporating Suggestions Based on Professor's Feedback)":
-#     st.subheader("Complaints by Housing Block and Type- Incorporating Suggestions Based on Professor's Feedback")
-#     # Filtering the data based on the selected year and housing block
-#     filtered_data_time = data  # Use filtered_data if date range is not needed
-#     if selected_year != 'All Time':
-#         filtered_data_time = filtered_data_time[filtered_data_time['Year Reported'] == selected_year]
-#     # Further filtering by Housing Block (if applicable)
-#     if selected_block != 'All Blocks':
-#         filtered_data_time = filtered_data_time[filtered_data_time['Housing Block'] == selected_block]
-#     # Pivoting the data based on the filtered data
-#     complaint_pivot = filtered_data_time.pivot_table(
-#         index='Housing Block',
-#         columns='Type of Complaint',
-#         values='Disposition',
-#         aggfunc='count',
-#         fill_value=0
-#     )
-#     # Ensuring the pivoted data is numeric for plotting
-#     complaint_pivot = complaint_pivot.astype(float)
-#     # Desired order for the housing blocks
-#     desired_order = [
-#         '1 block', '100 block', '200 block', '300 block', '400 block', '500 block',
-#         '600 block', '700 block', '800 block', '900 block', '1000 block', '1100 block',
-#         '1200 block', '1300 block', '1400 block', '1500 block', '1600 block',
-#         '1700 block', '1800 block', '1900 block', '2000 block', '2100 block',
-#         '2200 block', '2300 block', '2400 block', '2500 block', '2600 block',
-#         '2700 block', '2800 block', '2900 block', '3000 block', '3100 block',
-#         '3200 block', '3300 block', '3400 block', '3500 block', '3600 block',
-#         '3700 block', '3800 block', '3900 block', '4000 block', '4100 block',
-#         '4200 block', '4300 block', '4400 block', '4500 block', '4600 block',
-#         '4700 block', '4800 block', '4900 block', '5000 block'
-#     ]
-#     # Reordering the index of the pivot table according to the desired order
-#     complaint_pivot = complaint_pivot.reindex(desired_order)
-#     # Calculating percentages for each complaint type per housing block
-#     percentages = complaint_pivot.div(complaint_pivot.sum(axis=1), axis=0) * 100
-#     # Plotting the data
-#     fig = complaint_pivot.plot(kind='bar', stacked=True, colormap='inferno', figsize=(10, 6)).get_figure()
-#     # Adding percentage labels to the plot
-#     ax = fig.gca()
-#     for idx, block in enumerate(complaint_pivot.index):
-#         cumulative_height = 0
-#         for i, complaint_type in enumerate(complaint_pivot.columns):
-#             count = complaint_pivot.iloc[idx, i]
-#             percent = percentages.iloc[idx, i]
-#             if count > 0:
-#                 # Compute the position for the percentage label
-#                 x_pos = idx - 0.4 + 0.8 / 2  # Adjusting the position of the label
-#                 y_pos = cumulative_height + count / 2
-#                 ax.text(
-#                     x_pos, y_pos, f"{percent:.1f}%",
-#                     ha='center', va='center',
-#                     fontsize=10, color='black',
-#                     bbox=dict(facecolor='white', alpha=0.7, edgecolor='none')
-#                 )
-#             cumulative_height += count
-#     # Display the plot in Streamlit
-#     st.pyplot(fig)
-#     # writeup
-#     st.write("""
-#     **What this visualization shows:**
-#     This bar chart displays the distribution of complaints by Housing Block and Complaint Type. The data is stacked to show the percentage of complaints per block, categorized by type. This allows for a quick comparison of the most common complaint types across different housing blocks. While the percentages may be challenging to read when data for all blocks is displayed, they become more valuable and easier to interpret when a single block is selected. Selecting a specific block allows for clearer insights into the proportion of each complaint type within that block, providing more actionable information.
-#     **Why it's interesting:**
-#     By analyzing the distribution of complaints by both block and type, organizations can identify specific areas where certain complaint types are more prevalent. This insight helps target interventions and allocate resources more efficiently based on the most common issues in different housing blocks.
-#     **Color Scheme:**
-#     The 'inferno' color palette is used to represent different complaint types, with darker shades indicating a higher frequency of complaints. The stacked bar chart makes it easy to compare the distribution of complaints by block and type.
-#     """)
 # In the above code, we incorporated all of the professor's suggestions and refined the chart to make it more useful for analysis while ensuring good aesthetics. Given that the data from block 3400 onwards is very sparse, we decided to exclude these records. This adjustment helped focus the visualization on the more relevant data, providing clearer insights and improving its overall effectiveness for analysis.
 # elif viz_type == "Complaints by Housing Block and Type (Incorporating Suggestions Based on Professor's Feedback)":
@@ -617,105 +617,6 @@ elif viz_type == "Complaints by Housing Block and Type":
 #     The 'inferno' color palette is used to represent different complaint types, with darker shades indicating a higher frequency of complaints. The stacked bar chart makes it easy to compare the distribution of complaints by block and type.
 #     """)
-elif viz_type == "Complaints by Housing Block and Type (Incorporating Suggestions Based on Professor's Feedback)":
-    st.subheader("Complaints by Housing Block and Type - Incorporating Suggestions Based on Professor's Feedback")
-    # Filtering the data based on the selected year
-    filtered_data_time = data.copy()  # Use filtered_data if date range is not needed
-    if selected_year != 'All Time':
-        filtered_data_time = filtered_data_time[filtered_data_time['Year Reported'] == selected_year]
-    # Define available blocks (up to '3300 block')
-    available_blocks = [
-        '1 block', '100 block', '200 block', '300 block', '400 block', '500 block',
-        '600 block', '700 block', '800 block', '900 block', '1000 block',
-        '1100 block', '1200 block', '1300 block', '1400 block', '1500 block',
-        '1600 block', '1700 block', '1800 block', '1900 block',
-        '2000 block', '2100 block', '2200 block', '2300 block',
-        '2400 block', '2500 block', '2600 block',
-        '2700 block', '2800 block', '2900 block',
-        '3000 block', '3100 block',
-        '3200 block', '3300 block'
-    ]
-    # Ensure selected_block is in available_blocks
-    if selected_block not in available_blocks:
-        selected_block = None  # or set to a default value
-    # Further filtering by Housing Block (if applicable)
-    if selected_block and selected_block != 'All Blocks':
-        filtered_data_time = filtered_data_time[filtered_data_time['Housing Block'] == selected_block]
-    # Pivoting the data based on the filtered data
-    complaint_pivot = filtered_data_time.pivot_table(
-        index='Housing Block',
-        columns='Type of Complaint',
-        values='Disposition',
-        aggfunc='count',
-        fill_value=0
-    )
-    # Ensuring the pivoted data is numeric for plotting
-    complaint_pivot = complaint_pivot.astype(float)
-    # Desired order for the housing blocks (up to '3300 block')
-    desired_order = available_blocks
-    # Reordering the index of the pivot table according to the desired order
-    complaint_pivot = complaint_pivot.reindex(desired_order)
-    # Calculating percentages for each complaint type per housing block
-    percentages = complaint_pivot.div(complaint_pivot.sum(axis=1), axis=0) * 100
-    # Plotting the data
-    fig, ax = plt.subplots(figsize=(10, 6))
-    if selected_block and selected_block != 'All Blocks':
-        # Only show the selected housing block
-        complaint_pivot.loc[[selected_block]].plot(kind='bar', stacked=True, colormap='inferno', ax=ax)
-        # Set x-ticks to only show the selected housing block
-        ax.set_xticks([0])
-        ax.set_xticklabels([selected_block])
-    else:
-        # Show all blocks up to 3300
-        complaint_pivot.plot(kind='bar', stacked=True, colormap='inferno', ax=ax)
-    # Adding percentage labels to the plot
-    for idx, (block, row) in enumerate(complaint_pivot.iterrows()):
-        cumulative_height = 0
-        for i, complaint_type in enumerate(row):
-            count = row[i]
-            percent = percentages.loc[block, complaint_type] if count > 0 else 0
-            if count > 0:
-                # Compute the position for the percentage label within each segment
-                x_pos = idx if selected_block is None else 0  # Adjust x position based on selection
-                y_pos = cumulative_height + count / 2  # Center within each segment
-                ax.text(
-                    x_pos, y_pos, f"{percent:.1f}%",
-                    ha='center', va='center',
-                    fontsize=10, color='black',
-                    bbox=dict(facecolor='white', alpha=0.7, edgecolor='none')
-                )
-            cumulative_height += count
-    # Display the plot in Streamlit
-    st.pyplot(fig)
-    # Writeup
-    st.write("""
-    **What this visualization shows:**
-    This bar chart displays the distribution of complaints by Housing Block and Complaint Type. The data is stacked to show the percentage of complaints per block, categorized by type. This allows for a quick comparison of the most common complaint types across different housing blocks. While the percentages may be challenging to read when data for all blocks is displayed, they become more valuable and easier to interpret when a single block is selected. Selecting a specific block allows for clearer insights into the proportion of each complaint type within that block, providing more actionable information.
-    **Why it's interesting:**
-    By analyzing the distribution of complaints by both block and type, organizations can identify specific areas where certain complaint types are more prevalent. This insight helps target interventions and allocate resources more efficiently based on the most common issues in different housing blocks.
-    **Color Scheme:**
-    The 'inferno' color palette is used to represent different complaint types, with darker shades indicating a higher frequency of complaints. The stacked bar chart makes it easy to compare the distribution of complaints by block and type.
-    """)
 # Footer
 st.markdown("---")

     The 'inferno' color palette is used to represent different complaint types, with darker shades indicating a higher frequency of complaints. The stacked bar chart makes it easy to compare the distribution of complaints by block and type.
 """)
+elif viz_type == "Complaints by Housing Block and Type (Incorporating Suggestions Based on Professor's Feedback)":
+    st.subheader("Complaints by Housing Block and Type- Incorporating Suggestions Based on Professor's Feedback")
+    # Filtering the data based on the selected year and housing block
+    filtered_data_time = data  # Use filtered_data if date range is not needed
+    if selected_year != 'All Time':
+        filtered_data_time = filtered_data_time[filtered_data_time['Year Reported'] == selected_year]
+    # Further filtering by Housing Block (if applicable)
+    if selected_block != 'All Blocks':
+        filtered_data_time = filtered_data_time[filtered_data_time['Housing Block'] == selected_block]
+    # Pivoting the data based on the filtered data
+    complaint_pivot = filtered_data_time.pivot_table(
+        index='Housing Block',
+        columns='Type of Complaint',
+        values='Disposition',
+        aggfunc='count',
+        fill_value=0
+    )
+    # Ensuring the pivoted data is numeric for plotting
+    complaint_pivot = complaint_pivot.astype(float)
+    # Desired order for the housing blocks
+    desired_order = [
+        '1 block', '100 block', '200 block', '300 block', '400 block', '500 block',
+        '600 block', '700 block', '800 block', '900 block', '1000 block', '1100 block',
+        '1200 block', '1300 block', '1400 block', '1500 block', '1600 block',
+        '1700 block', '1800 block', '1900 block', '2000 block', '2100 block',
+        '2200 block', '2300 block', '2400 block', '2500 block', '2600 block',
+        '2700 block', '2800 block', '2900 block', '3000 block', '3100 block',
+        '3200 block', '3300 block', '3400 block', '3500 block', '3600 block',
+        '3700 block', '3800 block', '3900 block', '4000 block', '4100 block',
+        '4200 block', '4300 block', '4400 block', '4500 block', '4600 block',
+        '4700 block', '4800 block', '4900 block', '5000 block'
+    ]
+    # Reordering the index of the pivot table according to the desired order
+    complaint_pivot = complaint_pivot.reindex(desired_order)
+    # Calculating percentages for each complaint type per housing block
+    percentages = complaint_pivot.div(complaint_pivot.sum(axis=1), axis=0) * 100
+    # Plotting the data
+    fig = complaint_pivot.plot(kind='bar', stacked=True, colormap='inferno', figsize=(10, 6)).get_figure()
+    # Adding percentage labels to the plot
+    ax = fig.gca()
+    for idx, block in enumerate(complaint_pivot.index):
+        cumulative_height = 0
+        for i, complaint_type in enumerate(complaint_pivot.columns):
+            count = complaint_pivot.iloc[idx, i]
+            percent = percentages.iloc[idx, i]
+            if count > 0:
+                # Compute the position for the percentage label
+                x_pos = idx - 0.4 + 0.8 / 2  # Adjusting the position of the label
+                y_pos = cumulative_height + count / 2
+                ax.text(
+                    x_pos, y_pos, f"{percent:.1f}%",
+                    ha='center', va='center',
+                    fontsize=10, color='black',
+                    bbox=dict(facecolor='white', alpha=0.7, edgecolor='none')
+                )
+            cumulative_height += count
+    # Display the plot in Streamlit
+    st.pyplot(fig)
+    # writeup
+    st.write("""
+    **What this visualization shows:**
+    This bar chart displays the distribution of complaints by Housing Block and Complaint Type. The data is stacked to show the percentage of complaints per block, categorized by type. This allows for a quick comparison of the most common complaint types across different housing blocks. While the percentages may be challenging to read when data for all blocks is displayed, they become more valuable and easier to interpret when a single block is selected. Selecting a specific block allows for clearer insights into the proportion of each complaint type within that block, providing more actionable information.
+    **Why it's interesting:**
+    By analyzing the distribution of complaints by both block and type, organizations can identify specific areas where certain complaint types are more prevalent. This insight helps target interventions and allocate resources more efficiently based on the most common issues in different housing blocks.
+    **Color Scheme:**
+    The 'inferno' color palette is used to represent different complaint types, with darker shades indicating a higher frequency of complaints. The stacked bar chart makes it easy to compare the distribution of complaints by block and type.
+    """)
 # In the above code, we incorporated all of the professor's suggestions and refined the chart to make it more useful for analysis while ensuring good aesthetics. Given that the data from block 3400 onwards is very sparse, we decided to exclude these records. This adjustment helped focus the visualization on the more relevant data, providing clearer insights and improving its overall effectiveness for analysis.
 # elif viz_type == "Complaints by Housing Block and Type (Incorporating Suggestions Based on Professor's Feedback)":
 #     The 'inferno' color palette is used to represent different complaint types, with darker shades indicating a higher frequency of complaints. The stacked bar chart makes it easy to compare the distribution of complaints by block and type.
 #     """)
 # Footer
 st.markdown("---")