File size: 6,340 Bytes
64ef255
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
"""
Iris Flower Classifier - Aplicaci贸n Gradio
============================================
Interfaz interactiva para clasificar flores Iris usando XGBoost.
"""

import gradio as gr
import joblib
import numpy as np
import pandas as pd
import json
import matplotlib.pyplot as plt
import seaborn as sns
import os

# Cargar modelo y metadata
model = joblib.load("model.joblib")
le = joblib.load("label_encoder.joblib")

with open("model_info.json") as f:
    model_info = json.load(f)

# Cargar datos para exploraci贸n
df = pd.read_csv("data/IRIS.csv")

# Rangos de features para los sliders
FEATURE_RANGES = {
    "sepal_length": (4.0, 8.0, 5.8),
    "sepal_width": (2.0, 4.5, 3.0),
    "petal_length": (1.0, 7.0, 3.8),
    "petal_width": (0.1, 2.5, 1.2),
}

SPECIES_EMOJI = {
    "Iris-setosa": "馃尭",
    "Iris-versicolor": "馃尯",
    "Iris-virginica": "馃尰",
}


def predict(sepal_length, sepal_width, petal_length, petal_width):
    """Predecir especie de Iris."""
    features = np.array([[sepal_length, sepal_width, petal_length, petal_width]])
    proba = model.predict_proba(features)[0]
    result = {
        f"{SPECIES_EMOJI.get(cls, '')} {cls}": float(p)
        for cls, p in zip(le.classes_, proba)
    }
    return result


def create_eda_plot(column, plot_type):
    """Generar gr谩fico EDA interactivo."""
    fig, ax = plt.subplots(figsize=(10, 6))

    if plot_type == "Histograma":
        for species in df['species'].unique():
            subset = df[df['species'] == species]
            ax.hist(subset[column], alpha=0.6, label=species, bins=15)
        ax.legend()
    elif plot_type == "Boxplot":
        sns.boxplot(x='species', y=column, data=df, ax=ax)
    elif plot_type == "Violin":
        sns.violinplot(x='species', y=column, data=df, ax=ax)
    elif plot_type == "Scatter (vs petal_length)":
        for species in df['species'].unique():
            subset = df[df['species'] == species]
            ax.scatter(subset[column], subset['petal_length'], alpha=0.7, label=species)
        ax.set_ylabel("petal_length")
        ax.legend()

    ax.set_title(f"{plot_type} de {column}")
    ax.set_xlabel(column)
    plt.tight_layout()
    return fig


def show_correlation():
    """Mostrar matriz de correlaci贸n."""
    fig, ax = plt.subplots(figsize=(8, 6))
    numeric_df = df.select_dtypes(include=[np.number])
    corr = numeric_df.corr()
    mask = np.triu(np.ones_like(corr, dtype=bool))
    sns.heatmap(corr, mask=mask, annot=True, fmt=".2f", cmap="coolwarm", center=0, ax=ax)
    ax.set_title("Matriz de Correlaci贸n")
    plt.tight_layout()
    return fig


def show_pairplot():
    """Generar pairplot."""
    fig = sns.pairplot(df, hue='species', diag_kind='kde', height=2.2)
    return fig.figure


# ============================================================
# INTERFAZ GRADIO
# ============================================================
numeric_cols = ["sepal_length", "sepal_width", "petal_length", "petal_width"]

with gr.Blocks(theme=gr.themes.Soft(), title="Iris Flower Classifier") as demo:
    gr.Markdown(
        """
        # 馃尯 Iris Flower Classifier
        Clasificador de flores Iris usando **XGBoost** entrenado con el
        [dataset de Kaggle](https://www.kaggle.com/datasets/sims22/irisflowerdatasets).
        """
    )

    with gr.Tab("馃敭 Predicci贸n"):
        with gr.Row():
            with gr.Column():
                sl = gr.Slider(*FEATURE_RANGES["sepal_length"], label="Sepal Length (cm)")
                sw = gr.Slider(*FEATURE_RANGES["sepal_width"], label="Sepal Width (cm)")
                pl = gr.Slider(*FEATURE_RANGES["petal_length"], label="Petal Length (cm)")
                pw = gr.Slider(*FEATURE_RANGES["petal_width"], label="Petal Width (cm)")
                predict_btn = gr.Button("Clasificar", variant="primary")
            with gr.Column():
                output_label = gr.Label(num_top_classes=3, label="Predicci贸n")

        predict_btn.click(predict, inputs=[sl, sw, pl, pw], outputs=output_label)

        gr.Examples(
            examples=[
                [5.1, 3.5, 1.4, 0.2],   # Setosa
                [6.2, 2.9, 4.3, 1.3],   # Versicolor
                [7.7, 3.0, 6.1, 2.3],   # Virginica
            ],
            inputs=[sl, sw, pl, pw],
            label="Ejemplos por especie",
        )

    with gr.Tab("馃搳 EDA Interactivo"):
        with gr.Row():
            col_selector = gr.Dropdown(
                choices=numeric_cols, value="petal_length", label="Feature"
            )
            plot_type = gr.Dropdown(
                choices=["Histograma", "Boxplot", "Violin", "Scatter (vs petal_length)"],
                value="Histograma",
                label="Tipo de gr谩fico",
            )
        eda_plot = gr.Plot(label="Visualizaci贸n")
        col_selector.change(create_eda_plot, [col_selector, plot_type], eda_plot)
        plot_type.change(create_eda_plot, [col_selector, plot_type], eda_plot)

        with gr.Row():
            corr_btn = gr.Button("Matriz de Correlaci贸n")
            pair_btn = gr.Button("Pairplot")
        extra_plot = gr.Plot(label="An谩lisis")
        corr_btn.click(show_correlation, outputs=extra_plot)
        pair_btn.click(show_pairplot, outputs=extra_plot)

    with gr.Tab("馃搵 Datos"):
        gr.Markdown("### Dataset Iris (150 muestras)")
        gr.DataFrame(value=df, label="Dataset completo")
        gr.Markdown(f"### Estad铆sticas descriptivas")
        gr.DataFrame(value=df.describe().reset_index(), label="Estad铆sticas")

    with gr.Tab("馃搱 M茅tricas del Modelo"):
        gr.Markdown(f"""
        ### Rendimiento del modelo XGBoost
        - **Test Accuracy**: {model_info['metrics']['test_accuracy']:.4f}
        - **CV Accuracy**: {model_info['metrics']['cv_accuracy_mean']:.4f}{model_info['metrics']['cv_accuracy_std']:.4f}
        - **Clases**: {', '.join(model_info['classes'])}
        """)
        with gr.Row():
            if os.path.exists("outputs/confusion_matrix.png"):
                gr.Image(value="outputs/confusion_matrix.png", label="Confusion Matrix")
            if os.path.exists("outputs/feature_importance.png"):
                gr.Image(value="outputs/feature_importance.png", label="Feature Importance")
        gr.JSON(value=model_info, label="Metadata del modelo")


if __name__ == "__main__":
    demo.launch()