Spaces:
Sleeping
Sleeping
| # validate.py | |
| import os | |
| import joblib | |
| import pandas as pd | |
| from sklearn.metrics import classification_report | |
| from sklearn.feature_extraction.text import TfidfVectorizer | |
| from sklearn.multioutput import MultiOutputClassifier | |
| from lightgbm import LGBMClassifier | |
| from config import DATA_PATH, TEXT_COLUMN, LABEL_COLUMNS, MODEL_SAVE_DIR, TFIDF_PATH | |
| # Load validation data | |
| data = pd.read_csv(DATA_PATH) | |
| X = data[TEXT_COLUMN] | |
| y = data[LABEL_COLUMNS] | |
| # Load vectorizer and model | |
| vectorizer = joblib.load(TFIDF_PATH) | |
| X_vectorized = vectorizer.transform(X) | |
| model_path = os.path.join(MODEL_SAVE_DIR, "lgbm_multioutput.pkl") | |
| model = joblib.load(model_path) | |
| # Predict | |
| y_pred = model.predict(X_vectorized) | |
| # Evaluation | |
| print("\nValidation Report:\n") | |
| print(classification_report(y, y_pred, target_names=LABEL_COLUMNS)) | |