#!/usr/bin/env python3
"""Stack 2.9 - Simple Direct Load.

Loads the tokenizer and ``config.json`` from a local model directory with
Hugging Face networking and progress output switched off, then announces the
start of weight loading.
"""
import io
import json
import os
import struct
import warnings
from pathlib import Path

# Kill ALL huggingface networking and progress.
# Set before the third-party imports below so the settings are already in
# place when those libraries load.
os.environ['HF_HUB_DISABLE_HTTP'] = '1'
# NOTE(review): HF_HUB_OFFLINE is the offline switch documented by
# huggingface_hub; the variable above is kept for backward compatibility.
os.environ['HF_HUB_OFFLINE'] = '1'
os.environ['HF_HUB_DISABLE_PROGRESS_BARS'] = '1'
os.environ['TRANSFORMERS_OFFLINE'] = '1'
os.environ['TOKENIZERS_PARALLELISM'] = 'false'

import torch  # noqa: E402  (must follow the environment setup)

# Silence every warning raised from this point on, including those emitted
# while the tokenizer libraries are imported.
warnings.filterwarnings('ignore')

from tokenizers import Tokenizer  # noqa: E402
from transformers import PreTrainedTokenizerFast  # noqa: E402

model_path = Path("/Users/walidsobhi/stack-2-9-final-model")
tokenizer_file = str(model_path / "tokenizer.json")

print("Loading...")

# Load tokenizer
# NOTE(review): `tokenizer` is not used in the visible part of the script;
# kept because later code may rely on it.
tokenizer = Tokenizer.from_file(tokenizer_file)

# Need a PretrainedTokenizer for generation
fast_tokenizer = PreTrainedTokenizerFast(tokenizer_file=tokenizer_file)
fast_tokenizer.pad_token = "<|endoftext|>"
fast_tokenizer.eos_token = "<|endoftext|>"
print("Tokenizer ready")

# Load config (explicit encoding so decoding does not depend on the locale)
with open(model_path / "config.json", encoding="utf-8") as f:
    cfg = json.load(f)

# Load weights using torch directly (no safetensors lib needed for loading)
print("Loading safetensors...")

# NOTE(review): the source is cut off inside the definition below. The
# fragment is preserved verbatim as comments so the script stays parseable;
# restore the complete function from the original file.
#
# # Read safetensors header
# def load_safetensors_torch(path):
#     """Load safetensors file using torch only"""
#     with open(path, 'rb') as f:
#         # Read header size
#         header_size_bytes = f.read(8)
#         header_size = struct.unpack('