Spaces:
Sleeping
Sleeping
File size: 810 Bytes
406fb75 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 |
# validate.py
import os
import joblib
import pandas as pd
from sklearn.metrics import classification_report
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.multioutput import MultiOutputClassifier
from lightgbm import LGBMClassifier
from config import DATA_PATH, TEXT_COLUMN, LABEL_COLUMNS, MODEL_SAVE_DIR, TFIDF_PATH
# Load validation data
data = pd.read_csv(DATA_PATH)
X = data[TEXT_COLUMN]
y = data[LABEL_COLUMNS]
# Load vectorizer and model
vectorizer = joblib.load(TFIDF_PATH)
X_vectorized = vectorizer.transform(X)
model_path = os.path.join(MODEL_SAVE_DIR, "lgbm_multioutput.pkl")
model = joblib.load(model_path)
# Predict
y_pred = model.predict(X_vectorized)
# Evaluation
print("\nValidation Report:\n")
print(classification_report(y, y_pred, target_names=LABEL_COLUMNS))
|