Spaces:

hansche
/

SocialMediaFoci

Sleeping

Bismark

Update Space

5ab54b7 5 months ago

1.21 kB

	import os
	import joblib
	import string
	import re
	import nltk
	from nltk.corpus import stopwords

	# Get the directory of the current script
	script_dir = os.path.dirname(__file__)

	# Construct paths to the model and vectorizer files
	model_path = os.path.join(script_dir, "naive_bayes_model.pkl")
	vectorizer_path = os.path.join(script_dir, "tfidf_vectorizer.pkl")

	# Load saved model and vectorizer
	try:
	model = joblib.load(model_path)
	vectorizer = joblib.load(vectorizer_path)
	except FileNotFoundError as e:
	print(f"Error: {e}")
	raise

	# Load stopwords
	nltk.download("stopwords")
	stop_words = set(stopwords.words("english") + stopwords.words("french"))

	# Function to clean text (must match preprocessing in training script)
	def clean_text(text):
	if isinstance(text, float):
	return ""
	text = text.lower()
	text = re.sub(f"[{string.punctuation}]", "", text)
	text = " ".join([word for word in text.split() if word not in stop_words])
	return text

	# Function to predict sentiment
	def predict_sentiment(text):
	cleaned_text = clean_text(text)
	vectorized_text = vectorizer.transform([cleaned_text])
	prediction = model.predict(vectorized_text)
	return prediction[0]