"""hanuman_pkg
Helper to load the custom Hanuman model directly from a Hugging Face repo.
Usage:
from hanuman_pkg import from_pretrained
model, tokenizer = from_pretrained("ZombitX64/GPT4All-Model")
This will download `modeling.py`, `config.json` and `pytorch_model.bin` (if present)
from the repo and dynamically import the Hanuman class.
"""
from __future__ import annotations

import importlib.util
import json
from typing import Tuple

import torch
from huggingface_hub import hf_hub_download
from safetensors.torch import load_file as load_safetensors
from transformers import AutoTokenizer


def _download_file(repo_id: str, filename: str) -> str:
    """Try to download `filename` from `repo_id`. Return the local path or raise."""
    try:
        return hf_hub_download(repo_id, filename)
    except Exception:
        # Fall back to the checkpoint subfolder used by this repo. Hub paths
        # always use forward slashes, so don't build them with os.path.join.
        try:
            return hf_hub_download(repo_id, filename, subfolder="out_run1/epoch-3")
        except Exception as e:
            raise RuntimeError(f"Failed to download {filename} from repo {repo_id}: {e}") from e


def _load_module_from_path(path: str, module_name: str):
    spec = importlib.util.spec_from_file_location(module_name, path)
    assert spec is not None and spec.loader is not None
    mod = importlib.util.module_from_spec(spec)
    spec.loader.exec_module(mod)
    return mod


def from_pretrained(repo_id: str, map_location: str = "cpu") -> Tuple[torch.nn.Module, object]:
    """Download model artifacts from HF and return (model, tokenizer).

    Args:
        repo_id: Hugging Face repo id, e.g. "username/model-repo"
        map_location: device string used when loading the weights

    Returns:
        model: Hanuman model instance (on CPU unless moved)
        tokenizer: transformers tokenizer loaded from the repo
    """
    # Load the tokenizer via transformers (works directly with HF repos).
    tokenizer = AutoTokenizer.from_pretrained(repo_id)

    # Download and parse the model config.
    cfg_path = _download_file(repo_id, "config.json")
    with open(cfg_path, "r", encoding="utf-8") as f:
        cfg = json.load(f)

    # Download modeling.py and import it dynamically.
    modeling_path = _download_file(repo_id, "modeling.py")
    modeling_mod = _load_module_from_path(modeling_path, "hanuman_modeling")
    if not hasattr(modeling_mod, "Hanuman"):
        raise RuntimeError("Downloaded modeling.py does not define a Hanuman class")
    Hanuman = modeling_mod.Hanuman

    # Instantiate the model using values from the config, with fallbacks
    # for any missing keys.
    model = Hanuman(
        vocab_size=cfg.get("vocab_size", 32000),
        n_positions=cfg.get("n_positions", cfg.get("n_ctx", 4096)),
        n_embd=cfg.get("n_embd", 512),
        n_layer=cfg.get("n_layer", 8),
        n_head=cfg.get("n_head", 8),
        use_think_head=cfg.get("use_think_head", True),
    )

    # Download the weights, preferring safetensors when available.
    is_safetensors = True
    try:
        state_path = _download_file(repo_id, "pytorch_model.safetensors")
    except Exception:
        is_safetensors = False
        try:
            state_path = _download_file(repo_id, "pytorch_model.bin")
        except Exception as e:
            raise RuntimeError(f"Failed to download model weights: {e}") from e

    # Load the state dict. torch.load cannot read safetensors files, so
    # dispatch on whichever format was actually downloaded.
    if is_safetensors:
        state = load_safetensors(state_path, device=map_location)
    else:
        state = torch.load(state_path, map_location=map_location)
    model.load_state_dict(state)
    return model, tokenizer
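

if __name__ == "__main__":
    # Minimal smoke test: a sketch of how the loader is meant to be used.
    # The repo id comes from the module docstring; the forward-pass call
    # signature (input_ids -> output) is an assumption for illustration and
    # should be adjusted to match whatever modeling.py actually defines.
    model, tokenizer = from_pretrained("ZombitX64/GPT4All-Model")
    model.eval()
    enc = tokenizer("Hello, Hanuman!", return_tensors="pt")
    with torch.no_grad():
        out = model(enc["input_ids"])  # assumed call signature; see modeling.py
    print(type(out))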