# File size: 4,355 Bytes

# a3a4cf2

import gradio as gr
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler, LabelEncoder
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import (
    accuracy_score, precision_score, recall_score, f1_score,
    confusion_matrix, classification_report
)
import seaborn as sns
import matplotlib.pyplot as plt


def _make_synthetic_stock_data(n_records, seed):
    """Return a DataFrame of uniformly random fundamentals and random ratings.

    A local ``RandomState`` is used instead of ``np.random.seed`` so that the
    process-wide NumPy generator is not reseeded on every call; for the same
    seed it produces the same legacy draw sequence.
    """
    rng = np.random.RandomState(seed)
    # Draw order matters for reproducibility: keep the columns in this order.
    return pd.DataFrame({
        'pe_ratio': rng.uniform(5, 50, n_records),
        'de_ratio': rng.uniform(0.1, 3.0, n_records),
        'roe': rng.uniform(5, 40, n_records),
        'market_cap': rng.uniform(500, 100000, n_records),
        'dividend_yield': rng.uniform(0.5, 5.0, n_records),
        'stock_rating': rng.choice(['Buy', 'Hold', 'Sell'], n_records, p=[0.4, 0.4, 0.2]),
    })


def _save_report_table(report_df, path):
    """Render *report_df* as a matplotlib table image and write it to *path*."""
    fig, ax = plt.subplots(figsize=(8, 4))
    try:
        ax.axis('off')
        tbl = ax.table(
            cellText=report_df.values,
            colLabels=report_df.columns,
            rowLabels=report_df.index,
            cellLoc='center',
            loc='center'
        )
        tbl.auto_set_font_size(False)
        tbl.set_fontsize(10)
        tbl.scale(1.2, 1.2)
        for cell in tbl.get_celld().values():
            cell.set_linewidth(0.8)
        # Save/close the explicit figure rather than pyplot's "current" one.
        fig.savefig(path, bbox_inches='tight')
    finally:
        plt.close(fig)


def _save_confusion_matrix(cm, class_names, path):
    """Render confusion matrix *cm* as an annotated heatmap and write it to *path*."""
    fig, ax = plt.subplots(figsize=(6, 5))
    try:
        sns.heatmap(cm, annot=True, fmt="d", cmap="Blues",
                    xticklabels=class_names, yticklabels=class_names, ax=ax)
        ax.set_xlabel("Predicted")
        ax.set_ylabel("Actual")
        ax.set_title("Confusion Matrix")
        fig.savefig(path, bbox_inches='tight')
    finally:
        plt.close(fig)


def train_and_evaluate_model():
    """Train a random forest on synthetic stock data and report test metrics.

    Generates 10,000 synthetic records, holds out a stratified 20% test split,
    standardizes the features, fits a ``RandomForestClassifier`` and evaluates
    it on the held-out rows.

    Returns:
        A 3-tuple ``(markdown, report_path, matrix_path)``: a Markdown string
        with accuracy and weighted precision/recall/F1, the path of the saved
        classification-report image, and the path of the saved
        confusion-matrix image.

    Side effects:
        Writes ``classification_report.png`` and ``confusion_matrix.png`` to
        the current working directory, overwriting any existing files.
    """
    df = _make_synthetic_stock_data(n_records=10000, seed=42)

    # Prepare data
    X = df.drop('stock_rating', axis=1)
    y = df['stock_rating']

    le = LabelEncoder()
    y_encoded = le.fit_transform(y)

    # Split (stratified so the test set keeps the class proportions)
    X_train, X_test, y_train, y_test = train_test_split(
        X, y_encoded, test_size=0.2, random_state=42, stratify=y_encoded
    )

    # Scale: fit on the training rows only, then apply to the test rows
    scaler = StandardScaler()
    X_train_scaled = scaler.fit_transform(X_train)
    X_test_scaled = scaler.transform(X_test)

    # Train
    model = RandomForestClassifier(random_state=42)
    model.fit(X_train_scaled, y_train)

    # Predict, then map encoded classes back to their string labels so the
    # report and confusion matrix are labelled with the rating names
    y_pred = model.predict(X_test_scaled)
    y_test_labels = le.inverse_transform(y_test)
    y_pred_labels = le.inverse_transform(y_pred)

    # Metrics
    acc = accuracy_score(y_test_labels, y_pred_labels)
    prec = precision_score(y_test_labels, y_pred_labels, average='weighted', zero_division=0)
    rec = recall_score(y_test_labels, y_pred_labels, average='weighted', zero_division=0)
    f1 = f1_score(y_test_labels, y_pred_labels, average='weighted', zero_division=0)

    # Classification report image
    report_dict = classification_report(y_test_labels, y_pred_labels, output_dict=True, zero_division=0)
    report_df = pd.DataFrame(report_dict).transpose().round(2)
    cr_path = "classification_report.png"
    _save_report_table(report_df, cr_path)

    # Confusion matrix image
    cm = confusion_matrix(y_test_labels, y_pred_labels, labels=le.classes_)
    cm_path = "confusion_matrix.png"
    _save_confusion_matrix(cm, le.classes_, cm_path)

    # Output metrics as Markdown
    output = f"""
### ✅ Evaluation Metrics:
- **Accuracy:** {acc:.2f}
- **Precision:** {prec:.2f}
- **Recall:** {rec:.2f}
- **F1 Score:** {f1:.2f}
"""

    return output, cr_path, cm_path


# Gradio Interface
# Builds the UI at import time. Components are laid out in the order they are
# created inside the nested Blocks/Row/Column context managers, so statement
# order here determines the on-screen order.
with gr.Blocks() as demo:
    gr.Markdown("## 🧠 Stock Rating Prediction Model Evaluation")
    gr.Markdown("Click the button below to train the model on synthetic stock data and evaluate its performance.")

    eval_btn = gr.Button("Run Model Evaluation")

    # First row: metrics text (left column) next to a static benchmark image
    # (right column).
    with gr.Row():
        with gr.Column():
            output_md = gr.Markdown()  # Starts empty; receives the metrics Markdown on click
        
        with gr.Column():
            gr.Markdown("### 📌 Benchmark Guide\n\n")
            # NOTE(review): presumably "Model_Benchmark.png" ships alongside
            # this script; the relative path is resolved at runtime — confirm
            # the file exists in the working directory.
            benchmark_img = gr.Image(
                value="Model_Benchmark.png",
                type="filepath",
                show_label=False  # Hide the label; the heading above serves as the title
            )

    # Second row: the two images produced by train_and_evaluate_model.
    with gr.Row():
        report_img = gr.Image(type="filepath", label="📊 Classification Report")
        cm_img = gr.Image(type="filepath", label="📉 Confusion Matrix")

    # No `inputs` are wired, so the handler is called without arguments. Its
    # 3-tuple return value (markdown, report path, matrix path) is assigned
    # to the output components positionally, in the order listed here.
    eval_btn.click(
        fn=train_and_evaluate_model,
        outputs=[output_md, report_img, cm_img]
    )

# Runs unconditionally when this module is executed or imported (there is no
# `if __name__ == "__main__"` guard).
demo.launch()