Spaces:

Julseb42
/

nlp-project

Sleeping

nlp-project / scripts /test_functions-checkpoint.py

Test deploy

8e83170 12 months ago

1.24 kB

	from importlib import reload
	import sys

	sys.path.append("..")

	# Reload modules to make sure the latest code is used
	import scripts.get_dataset
	import utils.text_cleaning
	import utils.data_process # optional

	reload(scripts.get_dataset)
	reload(utils.text_cleaning)
	reload(utils.data_process)

	# Import functions
	from scripts.get_dataset import load_data
	from utils.text_cleaning import preprocess_reviews

	# Check load_data
	print("\nChecking load_data...")
	try:
	df = load_data()
	print("load_data() succeeded.")
	print("Shape:", df.shape)
	print("Columns:", df.columns.tolist())
	except Exception as e:
	print("load_data() failed:", e)

	# Check 'reviews.text' column ===
	print("\nChecking 'reviews.text' column...")
	if "reviews.text" in df.columns:
	print("'reviews.text' column found.")
	else:
	print("'reviews.text' column is missing. Check dataset format.")

	# Check preprocess_reviews ===
	print("\nChecking preprocess_reviews...")
	try:
	df_sample = df.head(3).copy()
	df_cleaned = preprocess_reviews(df_sample, column="reviews.text")
	print("preprocess_reviews() succeeded.")
	print("Sample cleaned text:\n", df_cleaned["reviews.text"])
	except Exception as e:
	print("preprocess_reviews() failed:", e)