File size: 512 Bytes
0c99808
 
 
4882762
0c99808
 
 
 
e829476
0c99808
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
"""
Load the Hugging Face dataset once as a module-level singleton.

Task-specific columns are declared per task under ``tasks/<name>/spec.py``.
"""

from datasets import load_dataset

from earnings_analyst.environment_config import DATASET_FILE, DATASET_ID

# Module-level singleton: the load runs when this module is first imported,
# and every reset reuses the resulting object.
# Only DATASET_FILE is requested from the Hub repo, so sibling files such as
# features.parquet / raw_*.parquet are never picked up.
_TRAIN_FILES = {"train": DATASET_FILE}
dataset = load_dataset(DATASET_ID, data_files=_TRAIN_FILES, split="train")