{ "model_type": "sklearn", "task": "regression", "target": "nasa_radiation", "prediction_column": "prediction_label", "library_name": "pycaret", "pycaret_version": "3.2.0", "scikit_learn_version": "1.2.2", "serialization": "pickle", "estimator_class": "sklearn.ensemble.RandomForestRegressor", "pipeline": { "preprocessing": [ { "name": "numerical_imputer", "transformer": "sklearn.impute.SimpleImputer", "includes": ["sp", "t", "r2", "u10", "v10", "SUNSD", "lcc", "mcc", "hcc", "sdswrf"] }, { "name": "categorical_imputer", "transformer": "sklearn.impute.SimpleImputer", "strategy": "most_frequent", "includes": [] }, { "name": "normalize", "transformer": "sklearn.preprocessing.MinMaxScaler" } ], "trained_model": { "name": "RandomForestRegressor", "params": { "n_jobs": -1, "random_state": 123 } } }, "input_schema": { "features": [ { "name": "sp", "dtype": "float" }, { "name": "t", "dtype": "float" }, { "name": "r2", "dtype": "float" }, { "name": "u10", "dtype": "float" }, { "name": "v10", "dtype": "float" }, { "name": "SUNSD", "dtype": "float" }, { "name": "lcc", "dtype": "float" }, { "name": "mcc", "dtype": "float" }, { "name": "hcc", "dtype": "float" }, { "name": "sdswrf", "dtype": "float" } ] }, "evaluation": { "split": "holdout", "rows": 972260, "metrics": { "MAE": 75.50362673902671, "RMSE": 126.1365660235317, "R2": 0.7516510842417514 }, "notes": [ "Metrics computed from MAKING_MODEL/holdout_pred.csv using columns nasa_radiation (true) and prediction_label (pred).", "MAPE is omitted because nasa_radiation can be near zero, which makes percentage errors unstable." ] }, "training_data": { "source_file": "integrated_gfs_nasa_power_2024_full.csv", "notes": [ "See TRAINING_ARTIFACTS/README.md for training/evaluation artifacts and scripts." ] }, "artifacts": { "files": ["Suncast_v1.pkl", "config.json"] } }