TNSA
/

NGen2-30M

Text Generation

Model card Files Files and versions

NGen2-30M / converter.py

Thishyaketh's picture

Upload 4 files

8e36426 verified 8 months ago

history blame contribute delete

2.03 kB

	import os
	import argparse
	import torch
	from safetensors.torch import save_file

	def extract_state_dict(checkpoint):
	"""
	Extracts the tensor dictionary from common .pth formats.
	"""
	if isinstance(checkpoint, dict):
	for key in ["state_dict", "model", "model_state_dict", "module"]:
	if key in checkpoint and isinstance(checkpoint[key], dict):
	return checkpoint[key]
	return checkpoint

	def convert_pth_to_safetensors(input_path, output_path=None):
	print(f"🔍 Loading checkpoint from: {input_path}")

	try:
	checkpoint = torch.load(input_path, map_location="cpu", weights_only=True)
	except Exception as e:
	print(f"❌ Error loading .pth file: {e}")
	return

	state_dict = extract_state_dict(checkpoint)

	if not isinstance(state_dict, dict):
	print("❌ Invalid checkpoint: not a dictionary.")
	return

	tensor_dict = {k: v for k, v in state_dict.items() if isinstance(v, torch.Tensor)}

	if not tensor_dict:
	print("❌ No tensor values found to convert.")
	return

	# Optionally add "model." prefix to HuggingFace-compatible keys
	if not all(k.startswith("model.") for k in tensor_dict):
	tensor_dict = {f"model.{k}": v for k, v in tensor_dict.items()}

	if output_path is None:
	output_path = os.path.splitext(input_path)[0] + ".safetensors"

	try:
	print(f"💾 Saving to: {output_path}")
	save_file(tensor_dict, output_path)
	print("✅ Conversion to .safetensors successful!")
	except Exception as e:
	print(f"❌ Saving failed: {e}")

	if __name__ == "__main__":
	parser = argparse.ArgumentParser(description="Convert .pth to .safetensors")
	parser.add_argument("input", help="Path to input .pth file")
	parser.add_argument("--output", help="Path to output .safetensors file (optional)")

	args = parser.parse_args()
	convert_pth_to_safetensors(args.input, args.output)