Spaces:

Peter512
/

developer-salary-predictor

Sleeping

App Files Files Community

Peter512 committed on Oct 9, 2025

Commit

b8ffbce

verified ·

1 Parent(s): a7a06f6

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -51

app.py CHANGED Viewed

@@ -349,70 +349,42 @@ if st.session_state.get('has_prediction', False):
         with col1:
             st.subheader("📈 Top Contributing Factors")
-            # Create feature mapping for better readability
-            def clean_feature_name(feature):
-                """Convert technical feature names to user-friendly labels"""
                 # Store original for fallback
                 original = feature
                 # Remove prefixes
                 feature = feature.replace('cat__', '').replace('num__', '').replace('remainder__', '')
-                # Simple mappings
                 simple_map = {
-                    'years_code_pro': 'Years of Experience',
-                    'age_group': 'Age Group',
-                    'so_account': 'Stack Overflow Account',
-                    'ai_select': 'Uses AI Tools'
                 }
                 if feature in simple_map:
                     return simple_map[feature]
-                # Handle categorical variables with prefixes
                 replacements = {
-                    'country_': 'Country: ',
-                    'remote_work_': 'Work: ',
-                    'dev_type_': 'Role: ',
-                    'org_size_': 'Company: ',
-                    'ed_level_': 'Education: '
                 }
-                for prefix, label in replacements.items():
                     if prefix in feature:
-                        return label + feature.replace(prefix, '').replace('_', ' ')
                 # Fallback: just clean up underscores and return
                 return feature.replace('_', ' ').title()
-            # Create emoji version for the table only
-            def clean_feature_name_with_emoji(feature):
-                """Convert technical feature names to user-friendly labels WITH emojis"""
-                # Get base cleaned name
-                base_name = clean_feature_name(feature)
-                # Add emojis based on content
-                if 'Years of Experience' in base_name:
-                    return '⏱️ ' + base_name
-                elif 'Age Group' in base_name:
-                    return '👤 ' + base_name
-                elif 'Country:' in base_name:
-                    return '🌍 ' + base_name
-                elif 'Work:' in base_name:
-                    return '🏠 ' + base_name
-                elif 'Role:' in base_name:
-                    return '💻 ' + base_name
-                elif 'Company:' in base_name:
-                    return '🏢 ' + base_name
-                elif 'Education:' in base_name:
-                    return '🎓 ' + base_name
-                elif 'Stack Overflow' in base_name:
-                    return '📚 ' + base_name
-                elif 'AI Tools' in base_name:
-                    return '🤖 ' + base_name
-                return base_name
             shap_df = pd.DataFrame({
                 'Feature': feature_names,
                 'SHAP Value': shap_values[0],
@@ -421,16 +393,18 @@ if st.session_state.get('has_prediction', False):
             shap_df['Abs SHAP'] = shap_df['SHAP Value'].abs()
             shap_df = shap_df.sort_values('Abs SHAP', ascending=False).head(10)
-            # Clean feature names
-            shap_df['Feature_Clean'] = shap_df['Feature'].apply(clean_feature_name)
             shap_df['Feature_Clean_Emoji'] = shap_df['Feature'].apply(clean_feature_name_with_emoji)
-            # Debug: Print to verify (optional - remove in production)
-            # st.write("Debug - Feature names:", list(zip(shap_df['Feature'], shap_df['Feature_Clean'])))
             # Create visualization with improved styling
             fig, ax = plt.subplots(figsize=(10, 6))
             # Modern color scheme
             colors = ['#10b981' if x > 0 else '#ef4444' for x in shap_df['SHAP Value']]
@@ -462,9 +436,9 @@ if st.session_state.get('has_prediction', False):
                     fontweight='bold', fontsize=10,
                     color=color)
-            # Set labels with cleaned names (no emojis)
             ax.set_yticks(range(len(shap_df)))
-            ax.set_yticklabels(shap_df['Feature_Clean'], fontsize=10)
             ax.set_xlabel('Impact on Salary (EUR)', fontsize=11, fontweight='bold')
             ax.set_title('How Different Factors Affect Your Salary',
                         fontsize=13, fontweight='bold', pad=20)

         with col1:
             st.subheader("📈 Top Contributing Factors")
+            # Create feature mapping for better readability WITH emojis
+            def clean_feature_name_with_emoji(feature):
+                """Convert technical feature names to user-friendly labels WITH emojis"""
                 # Store original for fallback
                 original = feature
                 # Remove prefixes
                 feature = feature.replace('cat__', '').replace('num__', '').replace('remainder__', '')
+                # Simple mappings with emojis
                 simple_map = {
+                    'years_code_pro': '⏱️ Years of Experience',
+                    'age_group': '👤 Age Group',
+                    'so_account': '📚 Stack Overflow Account',
+                    'ai_select': '🤖 Uses AI Tools'
                 }
                 if feature in simple_map:
                     return simple_map[feature]
+                # Handle categorical variables with prefixes and emojis
                 replacements = {
+                    'country_': ('🌍 Country: ', ''),
+                    'remote_work_': ('🏠 Work: ', ''),
+                    'dev_type_': ('💻 Role: ', ''),
+                    'org_size_': ('🏢 Company Size: ', ''),
+                    'ed_level_': ('🎓 Education: ', '')
                 }
+                for prefix, (emoji_label, _) in replacements.items():
                     if prefix in feature:
+                        return emoji_label + feature.replace(prefix, '').replace('_', ' ')
                 # Fallback: just clean up underscores and return
                 return feature.replace('_', ' ').title()
             shap_df = pd.DataFrame({
                 'Feature': feature_names,
                 'SHAP Value': shap_values[0],
             # Rank features by absolute SHAP value and keep the ten largest
             shap_df['Abs SHAP'] = shap_df['SHAP Value'].abs()
             shap_df = shap_df.sort_values('Abs SHAP', ascending=False).head(10)
             # Clean feature names with emojis
             shap_df['Feature_Clean_Emoji'] = shap_df['Feature'].apply(clean_feature_name_with_emoji)
             # Create visualization with improved styling
             fig, ax = plt.subplots(figsize=(10, 6))
             # Request DejaVu Sans for the text drawn below. NOTE(review): this
             # changes the process-wide rcParams, and the font may not contain a
             # glyph for every emoji used in the labels - confirm the rendered
             # chart on the deployment image.
             try:
                 plt.rcParams['font.family'] = 'DejaVu Sans'
             except (KeyError, ValueError):
                 # Only swallow rcParams key/validation errors; a bare
                 # ``except:`` would also hide KeyboardInterrupt/SystemExit.
                 pass
             # Modern color scheme: green for positive impact, red otherwise
             colors = ['#10b981' if x > 0 else '#ef4444' for x in shap_df['SHAP Value']]
                     fontweight='bold', fontsize=10,
                     color=color)
+            # Set labels with cleaned names WITH EMOJIS
             ax.set_yticks(range(len(shap_df)))
+            ax.set_yticklabels(shap_df['Feature_Clean_Emoji'], fontsize=10)
             ax.set_xlabel('Impact on Salary (EUR)', fontsize=11, fontweight='bold')
             ax.set_title('How Different Factors Affect Your Salary',
                         fontsize=13, fontweight='bold', pad=20)