Spaces:
Sleeping
Sleeping
| import pandas as pd | |
| import streamlit as st | |
| from pathlib import Path | |
| from huggingface_hub import snapshot_download | |
| import os | |
| def load_dataset(path: str | Path, category: str | None=None): | |
| DATA_OPTIONS = { | |
| 'Beauty': 'All_Beauty.parquet', | |
| 'Appliances': 'Appliances.parquet', | |
| 'Baby Products': 'Baby_Products.parquet', | |
| 'Electronics': 'Electronics.parquet', | |
| 'Health and Household': 'Health_and_Household.parquet', | |
| 'Movies and TV': 'Movies_and_TV.parquet' | |
| } | |
| if category: | |
| data_path = os.path.join(path, DATA_OPTIONS[category]) | |
| df = pd.read_parquet(data_path) | |
| else: | |
| df = pd.read_parquet(path) | |
| return df | |
def get_data_directory():
    """Download the review dataset repo and return its local directory.

    Calls ``snapshot_download`` for the ``tkbarb10/ads505-review-data``
    dataset repository and wraps the path it returns in a ``Path``.
    """
    # Pulls the whole review_data folder from the Dataset repo.
    snapshot_dir = snapshot_download(
        repo_type="dataset",
        repo_id="tkbarb10/ads505-review-data",
    )
    return Path(snapshot_dir)