Spaces:
Sleeping
Sleeping
| import kagglehub | |
| import shutil | |
| import os | |
| # Download the dataset from Kaggle | |
| path = kagglehub.dataset_download("datafiniti/consumer-reviews-of-amazon-products") | |
| # Check if the file already exists in ../dataset | |
| dataset_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), "..", "dataset") | |
| target_csv = "Datafiniti_Amazon_Consumer_Reviews_of_Amazon_Products_May19.csv" | |
| target_csv_path = os.path.join(dataset_dir, target_csv) | |
| if os.path.exists(target_csv_path): | |
| main_csv = target_csv | |
| path = dataset_dir # Set path to dataset directory for consistency | |
| else: | |
| # Find the main CSV file in the downloaded dataset | |
| csv_files = [f for f in os.listdir(path) if f.endswith(".csv")] | |
| main_csv = csv_files[0] # Use the first CSV file found | |
| # Save the main CSV file to the ./dataset directory | |
| os.makedirs("dataset", exist_ok=True) | |
| shutil.copy(os.path.join(path, main_csv), os.path.join("dataset", main_csv)) | |
| # Find the first CSV file in the dataset directory | |
| files = [f for f in os.listdir(path) if f.endswith(".csv")] | |
| csv_file = os.path.join(path, files[0]) | |