Spaces:
Sleeping
Sleeping
File size: 1,015 Bytes
5d4981c 4edde41 5d4981c 4edde41 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 |
import pandas as pd
import streamlit as st
from pathlib import Path
from huggingface_hub import snapshot_download
import os
@st.cache_data(show_spinner="Loading data...⏳")
def load_dataset(path: str | Path, category: str | None = None) -> pd.DataFrame:
    """Read a parquet file into a DataFrame.

    When ``category`` is given, ``path`` is treated as a directory and the
    parquet file mapped to that category is read from inside it. Otherwise
    ``path`` is handed to ``pd.read_parquet`` unchanged.

    Args:
        path: Directory holding the per-category parquet files, or the
            parquet location itself when no category is supplied.
        category: One of the keys of ``DATA_OPTIONS``. A falsy value
            (``None`` or ``""``) means "read ``path`` directly".

    Returns:
        The DataFrame produced by ``pd.read_parquet``.

    Raises:
        KeyError: If ``category`` is not one of the known category names.
    """
    DATA_OPTIONS = {
        'Beauty': 'All_Beauty.parquet',
        'Appliances': 'Appliances.parquet',
        'Baby Products': 'Baby_Products.parquet',
        'Electronics': 'Electronics.parquet',
        'Health and Household': 'Health_and_Household.parquet',
        'Movies and TV': 'Movies_and_TV.parquet',
    }

    # No category selected: the caller already points at the parquet data.
    if not category:
        return pd.read_parquet(path)

    try:
        filename = DATA_OPTIONS[category]
    except KeyError:
        # Same exception type as the plain dict lookup, but the message
        # tells the caller which category names are accepted.
        raise KeyError(
            f"Unknown category {category!r}; "
            f"expected one of {sorted(DATA_OPTIONS)}"
        ) from None

    return pd.read_parquet(os.path.join(path, filename))
@st.cache_resource
def get_data_directory() -> Path:
    """Download the review dataset repo and return its local directory.

    Returns:
        The path returned by ``snapshot_download`` for the
        ``tkbarb10/ads505-review-data`` dataset repo, wrapped in a ``Path``.
    """
    # No file filters are passed, so the full dataset repo snapshot is fetched.
    data_path = snapshot_download(
        repo_id="tkbarb10/ads505-review-data",
        repo_type="dataset",
    )
    return Path(data_path)