{ "name": "SAM Tokenizer", "architecture": "NexusBPE", "organization": "AMFORGE", "version": "1.0", "vocab_size": 12000, "pad_id": 0, "bos_id": 1, "eos_id": 2, "unk_id": 3, "domains": [ "ROS", "HTTP", "MQTT", "DB", "WORKFLOW", "ECOMMERCE", "VEHICLE", "HOME", "CAL", "FILE" ], "structural_markers": [ "", "", "", "", "", "", "", "", "", "" ], "guarantees": [ "atomic numerics in supported ranges", "atomic domain markers and structural tags", "deterministic encoding", "bit-perfect roundtrip on structured payloads" ], "license": "apache-2.0", "homepage": "https://huggingface.co/AMFORGE/sam_tokenizer" }