{
  "_note": "Darwin-60B-DUO uses constituent tokenizers via gateway, not a unified one.",
  "constituent_tokenizers": {
    "darwin-28r": {
      "source_model": "FINAL-Bench/Darwin-28B-REASON",
      "tokenizer_family": "qwen3_5",
      "vocab_size_estimate": 151936
    },
    "awaxis-31b": {
      "source_model": "Anserwise/AWAXIS-Think-31B",
      "tokenizer_family": "gemma4",
      "vocab_size_estimate": 262144
    }
  },
  "routing_decision_layer": "language detection + domain classification (gateway/router.py) performs tokenization-free routing on the raw text before backend selection",
  "downstream_token_handling": "Each backend (vLLM serving the respective base model) handles its own tokenization. The gateway operates on text strings, not token IDs."
}