Spaces:
Sleeping
Sleeping
File size: 1,223 Bytes
9d8621a | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 | #!/usr/bin/env python3
"""Register dataset to Hugging Face Hub"""
import os
import logging
from huggingface_hub import HfApi, create_repo
from huggingface_hub.utils import RepositoryNotFoundError
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
HF_TOKEN = os.getenv("HF_TOKEN")
HF_USERNAME = os.getenv("HF_USERNAME", "SharleyK")
DATASET_NAME = os.getenv("DATASET_NAME", "PredictiveMaintenance")
repo_id = f"{HF_USERNAME}/{DATASET_NAME}"
if not HF_TOKEN:
raise ValueError("HF_TOKEN not set!")
logger.info(f"Registering dataset: {repo_id}")
api = HfApi(token=HF_TOKEN)
try:
api.repo_info(repo_id=repo_id, repo_type="dataset")
logger.info(f"✓ Repository exists: {repo_id}")
except RepositoryNotFoundError:
create_repo(repo_id=repo_id, repo_type="dataset", token=HF_TOKEN, private=False)
logger.info(f"✓ Created repository: {repo_id}")
if os.path.exists("data/engine_data.csv"):
api.upload_file(
path_or_fileobj="data/engine_data.csv",
path_in_repo="engine_data.csv",
repo_id=repo_id,
repo_type="dataset",
token=HF_TOKEN
)
logger.info("✓ Uploaded engine_data.csv")
logger.info("✓ Data registration completed!")
|