Spaces:
Sleeping
Sleeping
| from pathlib import Path | |
| from datasets import load_dataset | |
def main():
    """Fetch the ExioNAICS ``train`` split and store it as a raw CSV file.

    The CSV is written to ``data/raw/exionaics_raw.csv`` beneath the
    directory two levels above the folder containing this file. The
    ``data/raw`` folder is created if it does not exist yet. Afterwards a
    short summary (output path, shape, column names, first rows) is printed.
    """
    # parents[2] is two levels above the directory that holds this file.
    root = Path(__file__).resolve().parents[2]
    target_dir = root.joinpath("data", "raw")
    target_dir.mkdir(parents=True, exist_ok=True)

    # Load the split and convert it straight to a pandas DataFrame.
    frame = load_dataset("Yvnminc/ExioNAICS", split="train").to_pandas()

    csv_file = target_dir / "exionaics_raw.csv"
    frame.to_csv(csv_file, index=False)

    print(f"Saved raw data to: {csv_file}")
    print(f"Shape: {frame.shape}")
    print("\nColumns:")
    print(frame.columns.tolist())
    print("\nHead:")
    print(frame.head())
# Run the download only when this file is executed as a script, so that
# importing the module does not trigger it.
if __name__ == "__main__":
    main()