{
  "_note": "Darwin-60B-DUO uses its constituent models' tokenizers via the gateway rather than a single unified tokenizer.",
  "constituent_tokenizers": {
    "darwin-28r": {
      "source_model": "FINAL-Bench/Darwin-28B-REASON",
      "tokenizer_family": "qwen3_5",
      "vocab_size_estimate": 151936
    },
    "awaxis-31b": {
      "source_model": "Anserwise/AWAXIS-Think-31B",
      "tokenizer_family": "gemma4",
      "vocab_size_estimate": 262144
    }
  },
  "routing_decision_layer": "Language detection and domain classification (gateway/router.py) route each request on the raw text, without tokenizing it, before a backend is selected.",
  "downstream_token_handling": "Each backend (vLLM serving the respective base model) handles its own tokenization. The gateway operates on text strings, not token IDs."
}