Spaces:
Sleeping
Sleeping
Update superkart_sales_forecast.pkl
Browse files- superkart_sales_forecast.pkl +30 -8
superkart_sales_forecast.pkl
CHANGED
|
@@ -1,26 +1,48 @@
|
|
|
|
|
|
|
|
| 1 |
import joblib
|
| 2 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4 |
|
| 5 |
# -----------------------------
|
| 6 |
# Select Final Model Based on RMSE
|
| 7 |
# -----------------------------
|
| 8 |
-
# 'rf_best_model' and 'gb_best_model' are tuned models (Random Forest, Gradient Boosting)
|
| 9 |
best_model = rf_best_model if performance_df["RMSE"].idxmin() == "Random Forest (Tuned)" else gb_best_model
|
| 10 |
|
| 11 |
-
#
|
| 12 |
final_predictions = best_model.predict(X_test)
|
| 13 |
final_metrics = evaluate_model(y_test, final_predictions)
|
| 14 |
|
| 15 |
-
print("\
|
| 16 |
-
print("
|
| 17 |
|
| 18 |
# -----------------------------
|
| 19 |
# Serialize the Best Model
|
| 20 |
# -----------------------------
|
| 21 |
-
model_filename = "superkart_sales_forecast.pkl"
|
| 22 |
joblib.dump(best_model, model_filename)
|
| 23 |
-
print(f"\
|
| 24 |
|
| 25 |
# -----------------------------
|
| 26 |
# Load and Validate the Model
|
|
@@ -29,4 +51,4 @@ loaded_model = joblib.load(model_filename)
|
|
| 29 |
loaded_predictions = loaded_model.predict(X_test)
|
| 30 |
loaded_metrics = evaluate_model(y_test, loaded_predictions)
|
| 31 |
|
| 32 |
-
print("\
|
|
|
|
| 1 |
+
# model_export.py
|
| 2 |
+
|
| 3 |
import joblib
|
| 4 |
+
import pandas as pd
|
| 5 |
+
from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor # or whatever models you trained
|
| 6 |
+
|
| 7 |
+
# Replace with your actual evaluation function
|
| 8 |
+
def evaluate_model(y_true, y_pred):
|
| 9 |
+
from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score
|
| 10 |
+
return {
|
| 11 |
+
"RMSE": mean_squared_error(y_true, y_pred, squared=False),
|
| 12 |
+
"MAE": mean_absolute_error(y_true, y_pred),
|
| 13 |
+
"R2": r2_score(y_true, y_pred)
|
| 14 |
+
}
|
| 15 |
+
|
| 16 |
+
# Assume rf_best_model and gb_best_model are already trained
|
| 17 |
+
# Also assume we have performance_df with RMSE values
|
| 18 |
|
| 19 |
+
# Example: Simulate performance_df (you should use the real one)
|
| 20 |
+
# import pandas as pd
|
| 21 |
+
# performance_df = pd.DataFrame({
|
| 22 |
+
# "RMSE": {
|
| 23 |
+
# "Random Forest (Tuned)": 113.52,
|
| 24 |
+
# "Gradient Boosting (Tuned)": 119.40
|
| 25 |
+
# }
|
| 26 |
+
# })
|
| 27 |
|
| 28 |
# -----------------------------
|
| 29 |
# Select Final Model Based on RMSE
|
| 30 |
# -----------------------------
|
|
|
|
| 31 |
best_model = rf_best_model if performance_df["RMSE"].idxmin() == "Random Forest (Tuned)" else gb_best_model
|
| 32 |
|
| 33 |
+
# Predict and evaluate
|
| 34 |
final_predictions = best_model.predict(X_test)
|
| 35 |
final_metrics = evaluate_model(y_test, final_predictions)
|
| 36 |
|
| 37 |
+
print("\nBest Model Selected:", performance_df['RMSE'].idxmin())
|
| 38 |
+
print("Performance on Test Set:", final_metrics)
|
| 39 |
|
| 40 |
# -----------------------------
|
| 41 |
# Serialize the Best Model
|
| 42 |
# -----------------------------
|
| 43 |
+
model_filename = "superkart_sales_forecast.pkl"
|
| 44 |
joblib.dump(best_model, model_filename)
|
| 45 |
+
print(f"\nModel serialized and saved as: {model_filename}")
|
| 46 |
|
| 47 |
# -----------------------------
|
| 48 |
# Load and Validate the Model
|
|
|
|
| 51 |
loaded_predictions = loaded_model.predict(X_test)
|
| 52 |
loaded_metrics = evaluate_model(y_test, loaded_predictions)
|
| 53 |
|
| 54 |
+
print("\nLoaded Model Performance on Test Set:", loaded_metrics)
|