rahul7star committed on
Commit
33779ec
·
verified ·
1 Parent(s): 56ede89

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -28
app.py CHANGED
@@ -1,45 +1,28 @@
1
  import math
2
  import gradio as gr
3
  import pandas as pd
4
- from huggingface_hub import HfApi, hf_hub_download
5
 
6
  # ======================================================
7
  # CONFIG
8
  # ======================================================
9
- DATASET_REPO = "rahul7star/Wan-video"
10
- CSV_FILE = "train.csv"
11
 
12
  VIDEO_COL = "video"
13
  TEXT_COL = "text"
14
  DATE_COL = "date"
15
 
16
  # ======================================================
17
- # AUTH + DATA LOAD (LEARNED FROM YOUR SAMPLE)
18
  # ======================================================
19
- api = HfApi() # auto-reads HUGGINGFACE_HUB_TOKEN
 
 
 
20
 
21
-
22
- def load_dataset_csv():
23
- """
24
- Validate repo access and load CSV from private dataset.
25
- """
26
- # 1️⃣ Permission + existence check
27
- api.repo_info(repo_id=DATASET_REPO, repo_type="dataset")
28
-
29
- # 2️⃣ Download CSV (auth handled implicitly)
30
- csv_path = hf_hub_download(
31
- repo_id=DATASET_REPO,
32
- filename=CSV_FILE,
33
- repo_type="dataset"
34
- )
35
-
36
- # 3️⃣ Load dataframe
37
- df = pd.read_csv(csv_path)
38
- df = df[[VIDEO_COL, TEXT_COL, DATE_COL]].dropna().reset_index(drop=True)
39
- return df
40
-
41
-
42
- df = load_dataset_csv()
43
 
44
  # ======================================================
45
  # PAGINATION LOGIC
@@ -149,7 +132,7 @@ with gr.Blocks(theme=gr.themes.Soft(), css=css) as demo:
149
  gr.Markdown(
150
  """
151
  # 🎬 Wan Video Dataset Showcase
152
- Securely browsing a **private Hugging Face dataset**.
153
  """
154
  )
155
 
 
1
  import math
2
  import gradio as gr
3
  import pandas as pd
4
+ from datasets import load_dataset
5
 
6
  # ======================================================
7
  # CONFIG
8
  # ======================================================
9
+ DATASET_NAME = "rahul7star/Wan-video"
 
10
 
11
  VIDEO_COL = "video"
12
  TEXT_COL = "text"
13
  DATE_COL = "date"
14
 
15
  # ======================================================
16
+ # LOAD DATASET (PRIVATE-SAFE)
17
  # ======================================================
18
+ # Auth is handled automatically via:
19
+ # - `huggingface-cli login`
20
+ # - or the HF_TOKEN env var (legacy name: HUGGING_FACE_HUB_TOKEN)
21
+ dataset = load_dataset(DATASET_NAME, split="train")
22
 
23
+ # Convert to pandas for easy slicing
24
+ df = dataset.to_pandas()
25
+ df = df[[VIDEO_COL, TEXT_COL, DATE_COL]].dropna().reset_index(drop=True)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
 
27
  # ======================================================
28
  # PAGINATION LOGIC
 
132
  gr.Markdown(
133
  """
134
  # 🎬 Wan Video Dataset Showcase
135
+ Powered by **Hugging Face Datasets** (private-safe).
136
  """
137
  )
138