deva8217 commited on
Commit
6fe1cc9
·
verified ·
1 Parent(s): cb3caaa

Update superkart_sales_forecast.pkl

Browse files
Files changed (1) hide show
  1. superkart_sales_forecast.pkl +30 -8
superkart_sales_forecast.pkl CHANGED
@@ -1,26 +1,48 @@
 
 
1
  import joblib
2
- from sklearn.ensemble import RandomForestRegressor # or your actual model
 
 
 
 
 
 
 
 
 
 
 
 
 
3
 
 
 
 
 
 
 
 
 
4
 
5
  # -----------------------------
6
  # Select Final Model Based on RMSE
7
  # -----------------------------
8
- # 'rf_best_model' and 'gb_best_model' are tuned models (Random Forest, Gradient Boosting)
9
  best_model = rf_best_model if performance_df["RMSE"].idxmin() == "Random Forest (Tuned)" else gb_best_model
10
 
11
- # Make predictions and evaluate
12
  final_predictions = best_model.predict(X_test)
13
  final_metrics = evaluate_model(y_test, final_predictions)
14
 
15
- print("\n Best Model Selected:", performance_df['RMSE'].idxmin())
16
- print(" Performance on Test Set:", final_metrics)
17
 
18
  # -----------------------------
19
  # Serialize the Best Model
20
  # -----------------------------
21
- model_filename = "superkart_sales_forecast.pkl" # Hugging Face expects this name
22
  joblib.dump(best_model, model_filename)
23
- print(f"\n Model serialized and saved as: {model_filename}")
24
 
25
  # -----------------------------
26
  # Load and Validate the Model
@@ -29,4 +51,4 @@ loaded_model = joblib.load(model_filename)
29
  loaded_predictions = loaded_model.predict(X_test)
30
  loaded_metrics = evaluate_model(y_test, loaded_predictions)
31
 
32
- print("\n Loaded Model Performance on Test Set:", loaded_metrics)
 
1
+ # model_export.py
2
+
3
  import joblib
4
+ import pandas as pd
5
+ from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor # or whatever models you trained
6
+
7
+ # Replace with your actual evaluation function
8
+ def evaluate_model(y_true, y_pred):
9
+ from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score
10
+ return {
11
+ "RMSE": mean_squared_error(y_true, y_pred, squared=False),
12
+ "MAE": mean_absolute_error(y_true, y_pred),
13
+ "R2": r2_score(y_true, y_pred)
14
+ }
15
+
16
+ # Assume rf_best_model and gb_best_model are already trained
17
+ # Also assume we have performance_df with RMSE values
18
 
19
+ # Example: Simulate performance_df (you should use the real one)
20
+ # import pandas as pd
21
+ # performance_df = pd.DataFrame({
22
+ # "RMSE": {
23
+ # "Random Forest (Tuned)": 113.52,
24
+ # "Gradient Boosting (Tuned)": 119.40
25
+ # }
26
+ # })
27
 
28
  # -----------------------------
29
  # Select Final Model Based on RMSE
30
  # -----------------------------
 
31
  best_model = rf_best_model if performance_df["RMSE"].idxmin() == "Random Forest (Tuned)" else gb_best_model
32
 
33
+ # Predict and evaluate
34
  final_predictions = best_model.predict(X_test)
35
  final_metrics = evaluate_model(y_test, final_predictions)
36
 
37
+ print("\nBest Model Selected:", performance_df['RMSE'].idxmin())
38
+ print("Performance on Test Set:", final_metrics)
39
 
40
  # -----------------------------
41
  # Serialize the Best Model
42
  # -----------------------------
43
+ model_filename = "superkart_sales_forecast.pkl"
44
  joblib.dump(best_model, model_filename)
45
+ print(f"\nModel serialized and saved as: {model_filename}")
46
 
47
  # -----------------------------
48
  # Load and Validate the Model
 
51
  loaded_predictions = loaded_model.predict(X_test)
52
  loaded_metrics = evaluate_model(y_test, loaded_predictions)
53
 
54
+ print("\nLoaded Model Performance on Test Set:", loaded_metrics)