Initial release — Darwin-60B-DUO (Hybrid-A: Route 70% / Split-Refine 20% / Ensemble V_1 10%)

c2bfdba verified 2 days ago

2.5 kB

	{
	"_model_type_friendly": "duo",
	"_aggregate_brand": "Darwin-60B-DUO",
	"architectures": [
	"DarwinDuoOrchestrator"
	],
	"description": "Darwin family DUO — two SOTA constituents (English reasoning + Korean) served via a single OpenAI-compatible gateway. This repo contains the orchestrator gateway code; backend weights are fetched from the constituent repos at runtime.",
	"constituents": [
	{
	"role": "english_reasoning_specialist",
	"model_id": "FINAL-Bench/Darwin-28B-REASON",
	"served_name": "darwin-28r",
	"architecture": "qwen3_5",
	"params_total": 26895998464,
	"params_billion": 26.9,
	"verified_rank": "Hugging Face GPQA Diamond #3",
	"default_port": 8021,
	"default_dp_master_port": 45011,
	"quantization_recommended": "fp8",
	"vllm_extra_args": [
	"--enforce-eager",
	"--limit-mm-per-prompt", "{\"image\":0,\"video\":0}"
	]
	},
	{
	"role": "korean_specialist",
	"model_id": "Anserwise/AWAXIS-Think-31B",
	"served_name": "awaxis-31b",
	"architecture": "gemma4",
	"params_total": 31273086512,
	"params_billion": 31.27,
	"verified_rank": "National K-AI Leaderboard (MSIT, Korea) #1",
	"darwin_family_branch": "korean_specialist (Gemma-4 base)",
	"default_port": 8022,
	"default_dp_master_port": 45012,
	"quantization_recommended": "fp8",
	"vllm_extra_args": [
	"--enforce-eager",
	"--limit-mm-per-prompt", "{\"image\":0,\"video\":0}"
	]
	}
	],
	"aggregate_params_total": 58169084976,
	"aggregate_params_billion": 58.17,
	"active_params_router_mode_billion": 30,
	"active_params_ensemble_mode_billion": 60,
	"orchestration": {
	"strategy_name": "Hybrid-A",
	"version": "1.0",
	"distribution": {
	"route_korean": 0.50,
	"route_english": 0.20,
	"split_korean_with_reasoning": 0.15,
	"split_english_with_korean_context": 0.05,
	"ensemble_v1_mcq": 0.10
	},
	"average_cost_multiplier": 1.3,
	"modes": ["route", "split_refine", "ensemble_v1"]
	},
	"gateway": {
	"port": 8000,
	"served_model_name": "darwin-60b-duo",
	"openai_compatible": true,
	"endpoints": ["/v1/models", "/v1/chat/completions", "/v1/completions"]
	},
	"transformers_compatible": false,
	"_note": "This is NOT a direct transformers AutoModel.from_pretrained() target. Use the gateway (gateway/server.py) or Docker Compose (docker/docker-compose.yml). See README for full usage."
	}