|
|
|
|
|
""" |
|
|
HuggingFace Checkpoint Uploader for AGILLM-3 |
|
|
Usage: python hf_upload.py <checkpoint.pt> [--message "commit msg"] |
|
|
Requires: HF_TOKEN env var or ~/.huggingface/token |
|
|
""" |
|
|
import os |
|
|
import sys |
|
|
import argparse |
|
|
from pathlib import Path |
|
|
from datetime import datetime |
|
|
|
|
|
try: |
|
|
from huggingface_hub import HfApi, upload_file |
|
|
except ImportError: |
|
|
print("Installing huggingface_hub...") |
|
|
os.system("pip install huggingface_hub -q") |
|
|
from huggingface_hub import HfApi, upload_file |
|
|
|
|
|
REPO_ID = "OpenTransformer/AGILLM-3-large" |
|
|
|
|
|
def upload_checkpoint(ckpt_path: str, message: str = None): |
|
|
path = Path(ckpt_path) |
|
|
if not path.exists(): |
|
|
print(f"Error: {ckpt_path} not found") |
|
|
return False |
|
|
|
|
|
token = os.environ.get("HF_TOKEN") or None |
|
|
api = HfApi(token=token) |
|
|
|
|
|
|
|
|
step = "unknown" |
|
|
if "step" in path.stem: |
|
|
step = path.stem.split("step")[-1].split(".")[0] |
|
|
|
|
|
ts = datetime.now().strftime("%Y-%m-%d %H:%M") |
|
|
commit_msg = message or f"Checkpoint step {step} - {ts}" |
|
|
|
|
|
print(f"Uploading {path.name} to {REPO_ID}...") |
|
|
print(f"Size: {path.stat().st_size / 1e9:.2f} GB") |
|
|
|
|
|
try: |
|
|
upload_file( |
|
|
path_or_fileobj=str(path), |
|
|
path_in_repo=f"checkpoints/{path.name}", |
|
|
repo_id=REPO_ID, |
|
|
commit_message=commit_msg, |
|
|
token=token |
|
|
) |
|
|
print(f"SUCCESS: https://huggingface.co/{REPO_ID}") |
|
|
return True |
|
|
except Exception as e: |
|
|
print(f"Upload failed: {e}") |
|
|
return False |
|
|
|
|
|
if __name__ == "__main__": |
|
|
parser = argparse.ArgumentParser() |
|
|
parser.add_argument("checkpoint", help="Path to checkpoint .pt file") |
|
|
parser.add_argument("--message", "-m", help="Commit message") |
|
|
args = parser.parse_args() |
|
|
|
|
|
success = upload_checkpoint(args.checkpoint, args.message) |
|
|
sys.exit(0 if success else 1) |
|
|
|