Spaces:

aleuse
/

credit_score_prediction

Build error

App Files Files Community

Alexis Galvis committed on Mar 6, 2025

Commit

d790594

1 Parent(s): 84960aa

app

Browse files

Files changed (11) hide show

app.py +96 -0
data/output/loan_scores.pkl +3 -0
models/loan_model_2.h5 +3 -0
models/preprocessor.pkl +3 -0
requirements.txt +0 -0
utils/__pycache__/calculate_probability_prediction.cpython-310.pyc +0 -0
utils/__pycache__/category_classification.cpython-310.pyc +0 -0
utils/__pycache__/create_and_save_plot.cpython-310.pyc +0 -0
utils/calculate_probability_prediction.py +48 -0
utils/category_classification.py +15 -0
utils/create_and_save_plot.py +21 -0

app.py ADDED Viewed

	@@ -0,0 +1,96 @@

+import os
+import streamlit as st
+import numpy as np
+import tensorflow as tf
+import joblib
+import pandas as pd
+from utils.create_and_save_plot import plot_credit_score_distribution
+from utils.calculate_probability_prediction import probability_to_score_v3
+from utils.category_classification import credit_score_range_classification
+# Cargar modelo y preprocesador
+model = tf.keras.models.load_model("models/loan_model_2.h5")
+preprocessor = joblib.load("models/preprocessor.pkl")
+def calculate_dti(annual_income, total_monthly_debt):
+    """Calcula el Debt-to-Income Ratio (DTI)"""
+    if annual_income > 0:
+        monthly_income = annual_income / 12
+        dti = (total_monthly_debt / monthly_income) * 100
+        return round(dti, 2)
+    return 0
+# Interfaz Streamlit
+st.title("Predicción de Puntaje de Crédito")
+st.sidebar.header("Ingrese los valores del préstamo")
+# Nuevas variables de entrada con descripciones
+annual_inc = st.sidebar.number_input(
+    "Ingreso Anual (USD)", min_value=0.0, value=36000.0,
+    help="(float) Ingreso anual en dólares antes de impuestos."
+)
+emp_length = st.sidebar.selectbox(
+    "Tiempo en el Trabajo", ["< 1 year", "1-5 years", "6-10 years", "10+ years"],
+    help="(categoría) Duración del empleo actual."
+)
+home_ownership = st.sidebar.selectbox(
+    "Tipo de Propiedad", ["OWN", "MORTGAGE", "RENT"],
+    help="(categoría) Tipo de propiedad del solicitante."
+)
+purpose = st.sidebar.selectbox(
+    "Propósito del Préstamo", ["debt_consolidation", "credit_card", "home_improvement"],
+    help="(categoría) Razón principal del préstamo."
+)
+zip_code = st.sidebar.number_input(
+    "Código Postal", min_value=10000, max_value=99999, step=1, value=90210,
+    help="(int) Código postal de residencia del solicitante."
+)
+open_acc = st.sidebar.number_input(
+    "Cuentas Abiertas", min_value=0, step=1, value=5,
+    help="(int) Número total de cuentas de crédito abiertas."
+)
+total_monthly_debt = st.sidebar.number_input(
+    "Pagos Mensuales de Deuda (USD)", min_value=0.0, value=600.0,
+    help="(float) Total de pagos mensuales de deuda (préstamos, tarjetas, hipotecas)."
+)
+# Calcular DTI
+dti = calculate_dti(annual_inc, total_monthly_debt)
+st.sidebar.write(f"DTI Calculado: {dti}%")
+if st.sidebar.button("Predecir"):
+    # Crear el DataFrame con los datos de entrada
+    input_data = {
+        "annual_inc": [annual_inc],
+        "emp_length": [emp_length],
+        "home_ownership": [home_ownership],
+        "purpose": [purpose],
+        "zip_code": [zip_code],
+        "open_acc": [open_acc],
+        "dti": [dti]
+    }
+    df = pd.DataFrame(input_data)
+    # Preprocesar y predecir
+    data_processed = preprocessor.transform(df)
+    predictions = model.predict(data_processed).ravel()
+    y_scores = joblib.load(os.path.join('data', 'output', 'loan_scores.pkl'))
+    credit_score = probability_to_score_v3(predictions[0])
+    # Mostrar resultado
+    color = credit_score_range_classification(credit_score)
+    st.markdown(
+        f'<h2 style="color:{color};">Puntaje de Crédito Estimado: {credit_score:.2f}</h2>',
+        unsafe_allow_html=True
+    )
+    # Generar gráfico
+    buffer = plot_credit_score_distribution(y_scores, credit_score)
+    image_data = buffer.getvalue()
+    buffer.close()
+    st.image(image_data, caption="Distribución de Puntajes de Crédito", use_container_width=True)

data/output/loan_scores.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:67b1ef0919f5cff5e4732fa33c14334d830acf50b622c32bd44a63f8e4f5f98c
+size 474033

models/loan_model_2.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:24adab470382c8e80311421fe2b6fbd1cf73d665888a93b3a47303f55bd9a3e7
+size 708384

models/preprocessor.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9c2d49b06300e354172e421ff3e97c3c9fcc4cdafad346ad64e5da1275478b55
+size 5130

requirements.txt ADDED Viewed

Binary file (454 Bytes). View file

utils/__pycache__/calculate_probability_prediction.cpython-310.pyc ADDED Viewed

Binary file (1.27 kB). View file

utils/__pycache__/category_classification.cpython-310.pyc ADDED Viewed

Binary file (528 Bytes). View file

utils/__pycache__/create_and_save_plot.cpython-310.pyc ADDED Viewed

Binary file (964 Bytes). View file

utils/calculate_probability_prediction.py ADDED Viewed

	@@ -0,0 +1,48 @@

+import numpy as np
+def probability_to_score_v3(prob, base_score=300, max_score=850, threshold=0.326,
+                                   expansion_factor_low=3, expansion_factor_high=0.7):
+    """
+    Convierte probabilidades en puntajes de crédito con expansión no lineal
+    para distribuir mejor en los extremos.
+    Args:
+        prob (float): Probabilidad de default.
+        base_score (int): Puntaje base.
+        max_score (int): Puntaje máximo.
+        threshold (float): Valor de corte óptimo.
+        expansion_factor_low (float): Factor para expandir la parte baja del rango.
+        expansion_factor_high (float): Factor para expandir la parte alta del rango.
+    Returns:
+        score (float): Puntaje de crédito ajustado.
+    """
+    # Invertir la probabilidad para que mayor valor sea mejor score
+    inverted_prob = 1 - prob
+    # Punto de corte invertido
+    inverted_threshold = 1 - threshold
+    # Determinar si es un score alto o bajo
+    if inverted_prob >= inverted_threshold:  # Buenos clientes
+        # Normalizar la probabilidad en el rango de buenos
+        normalized = (inverted_prob - inverted_threshold) / (1 - inverted_threshold)
+        # Aplicar expansión no lineal
+        transformed = normalized ** expansion_factor_high
+        # Mapear al rango superior
+        mid_score = 550  # Punto medio del rango
+        score = mid_score + (max_score - mid_score) * transformed
+    else:  # Malos clientes
+        # Normalizar la probabilidad en el rango de malos
+        normalized = inverted_prob / inverted_threshold
+        # Aplicar expansión no lineal para los scores bajos
+        transformed = normalized ** expansion_factor_low
+        # Mapear al rango inferior
+        mid_score = 550  # Punto medio del rango
+        score = base_score + (mid_score - base_score) * transformed
+    # Asegurar que el score esté dentro del rango permitido
+    score = np.clip(score, base_score, max_score)
+    return score

utils/category_classification.py ADDED Viewed

	@@ -0,0 +1,15 @@

+def credit_score_range_classification(credit_score):
+    color = "white"
+    if (credit_score >= 300) and (credit_score <= 579):
+        color = "red"
+    elif (credit_score >= 580) and (credit_score <= 669):
+        color = "orange"
+    elif (credit_score >= 670) and (credit_score <= 739):
+        color = "yellow"
+    elif (credit_score >= 740) and (credit_score <= 799):
+        color = "lightgreen"
+    else:
+        color = "green"
+    return color

utils/create_and_save_plot.py ADDED Viewed

	@@ -0,0 +1,21 @@

+import matplotlib.pyplot as plt
+from io import BytesIO
+def plot_credit_score_distribution(scores, point):
+    plt.figure(figsize=(10, 6))
+    plt.hist(scores, bins=30, color='green', alpha=0.6)
+    plt.yscale('log')
+    plt.axvline(x=point, color='red', linestyle='--', label=f'Puntaje {point}')
+    plt.scatter(point, 1, color='red', s=100, zorder=5)
+    plt.title("Distribución de Puntajes de Crédito (300-850)")
+    plt.xlabel("Puntaje")
+    plt.ylabel("Frecuencia (escala logarítmica)")
+    plt.grid(True)
+    plt.legend()
+    buffer = BytesIO()
+    plt.savefig(buffer, format='png')
+    buffer.seek(0)  # Mover el puntero al inicio del buffer
+    plt.close()  # Cerrar la figura para liberar memoria
+    return buffer