diff --git "a/data/providers.json" "b/data/providers.json" --- "a/data/providers.json" +++ "b/data/providers.json" @@ -69,8 +69,7 @@ "size_b": 120, "capabilities": [ "tools", - "reasoning", - "eu-endpoint" + "reasoning" ], "hf_id": "openai/gpt-oss-120b" }, @@ -82,8 +81,7 @@ "currency": "USD", "size_b": 70, "capabilities": [ - "tools", - "eu-endpoint" + "tools" ], "hf_id": "meta-llama/Llama-3.3-70B-Instruct" }, @@ -220,8 +218,7 @@ "size_b": 120, "capabilities": [ "tools", - "reasoning", - "eu-endpoint" + "reasoning" ], "hf_id": "openai/gpt-oss-120b" }, @@ -251,7 +248,9 @@ "type": "embedding", "input_price_per_1m": 0, "output_price_per_1m": 0, - "currency": "CHF" + "currency": "CHF", + "hf_id": "sentence-transformers/all-MiniLM-L12-v2", + "size_b": 0.03 }, { "name": "Qwen3-Embedding-8B", @@ -266,7 +265,8 @@ "type": "audio", "input_price_per_1m": 0.006, "output_price_per_1m": 0, - "currency": "CHF" + "currency": "CHF", + "hf_id": "openai/whisper-large-v3" }, { "name": "Photomaker V2", @@ -312,8 +312,7 @@ "audio", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -338,8 +337,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -353,8 +351,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -367,8 +364,7 @@ "capabilities": [ "vision", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -381,8 +377,7 @@ "capabilities": [ "vision", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -409,8 +404,7 @@ "capabilities": [ "vision", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -423,8 +417,7 @@ "capabilities": [ "vision", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -472,8 +465,7 @@ "provider_upstream": "Meta", "capabilities": [ "vision", - "tools", - "eu-endpoint" + "tools" ], "size_b": 17, "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct" @@ -489,8 +481,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -502,8 +493,7 @@ "size_b": 70, "provider_upstream": "Meta", "capabilities": [ - "tools", - "eu-endpoint" + "tools" ], "hf_id": "meta-llama/Llama-3.3-70B-Instruct" }, @@ -518,8 +508,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -533,8 +522,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -548,8 +536,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -563,8 +550,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -578,8 +564,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -592,8 +577,7 @@ "capabilities": [ "vision", "files", - "tools", - "eu-endpoint" + "tools" ] }, { @@ -607,8 +591,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -622,8 +605,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -636,8 +618,7 @@ "capabilities": [ "vision", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -706,8 +687,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -721,8 +701,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -736,8 +715,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -751,8 +729,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -766,8 +743,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -781,8 +757,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -796,8 +771,7 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" ] }, { @@ -825,203 +799,3056 @@ "vision", "files", "tools", - "reasoning", - "eu-endpoint" + "reasoning" + ] + }, + { + "name": "GPT-5 Mini", + "type": "vision", + "input_price_per_1m": 0.23, + "output_price_per_1m": 1.86, + "currency": "EUR", + "provider_upstream": "OpenAI", + "capabilities": [ + "vision", + "files", + "tools", + "reasoning" + ] + }, + { + "name": "GPT-5", + "type": "vision", + "input_price_per_1m": 1.16, + "output_price_per_1m": 9.32, + "currency": "EUR", + "provider_upstream": "OpenAI", + "capabilities": [ + "vision", + "files", + "tools", + "reasoning" + ] + }, + { + "name": "GPT-4o Mini", + "type": "vision", + "input_price_per_1m": 0.14, + "output_price_per_1m": 0.56, + "currency": "EUR", + "provider_upstream": "OpenAI", + "capabilities": [ + "vision", + "files", + "tools" + ] + }, + { + "name": "GPT-4.1 nano", + "type": "vision", + "input_price_per_1m": 0.09, + "output_price_per_1m": 0.37, + "currency": "EUR", + "provider_upstream": "OpenAI", + "capabilities": [ + "vision", + "files", + "tools" + ] + }, + { + "name": "GPT-4o", + "type": "vision", + "input_price_per_1m": 2.56, + "output_price_per_1m": 10.25, + "currency": "EUR", + "provider_upstream": "OpenAI", + "capabilities": [ + "vision", + "files", + "tools" + ] + }, + { + "name": "GPT-4.1", + "type": "vision", + "input_price_per_1m": 1.86, + "output_price_per_1m": 7.45, + "currency": "EUR", + "provider_upstream": "OpenAI", + "capabilities": [ + "vision", + "files", + "tools" + ] + }, + { + "name": "GPT-4.1 mini", + "type": "vision", + "input_price_per_1m": 0.37, + "output_price_per_1m": 1.49, + "currency": "EUR", + "provider_upstream": "OpenAI", + "capabilities": [ + "vision", + "files", + "tools" + ] + }, + { + "name": "Gemini 3 Flash Preview", + "type": "vision", + "input_price_per_1m": 0.47, + "output_price_per_1m": 2.8, + "currency": "EUR", + "provider_upstream": "Google", + "capabilities": [ + "vision", + "video", + "audio", + "files", + "tools", + "reasoning" + ] + }, + { + "name": "GPT oss (120b)", + "type": "chat", + "input_price_per_1m": 0.28, + "output_price_per_1m": 2.33, + "currency": "EUR", + "size_b": 120, + "provider_upstream": "OpenAI", + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "openai/gpt-oss-120b" + }, + { + "name": "Gemini 2.5 Flash", + "type": "vision", + "input_price_per_1m": 0.28, + "output_price_per_1m": 2.33, + "currency": "EUR", + "provider_upstream": "Google", + "capabilities": [ + "vision", + "video", + "audio", + "files", + "tools", + "reasoning" + ] + }, + { + "name": "Gemini 2.5 Pro Reasoning", + "type": "vision", + "input_price_per_1m": 2.33, + "output_price_per_1m": 13.98, + "currency": "EUR", + "provider_upstream": "Google", + "capabilities": [ + "vision", + "video", + "audio", + "files", + "tools", + "reasoning" ] }, { - "name": "GPT-5 Mini", + "name": "Gemini 2.5 Pro", + "type": "vision", + "input_price_per_1m": 2.33, + "output_price_per_1m": 13.98, + "currency": "EUR", + "provider_upstream": "Google", + "capabilities": [ + "vision", + "video", + "audio", + "files", + "tools", + "reasoning" + ] + } + ] + }, + { + "name": "Requesty", + "url": "https://requesty.ai", + "headquarters": "USA", + "region": "Global", + "gdpr_compliant": true, + "eu_endpoints": true, + "models": [ + { + "name": "novita/meta-llama/llama-3.2-1b-instruct", + "type": "chat", + "input_price_per_1m": 0.02, + "output_price_per_1m": 0.02, + "currency": "USD", + "context_window": 131000, + "size_b": 1 + }, + { + "name": "deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo", + "type": "chat", + "input_price_per_1m": 0.02, + "output_price_per_1m": 0.05, + "currency": "USD", + "context_window": 131072, + "size_b": 8 + }, + { + "name": "openai/gpt-5-nano", + "type": "vision", + "input_price_per_1m": 0.025, + "output_price_per_1m": 0.2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "novita/meta-llama/llama-3.2-3b-instruct", + "type": "chat", + "input_price_per_1m": 0.03, + "output_price_per_1m": 0.05, + "currency": "USD", + "context_window": 32768, + "size_b": 3 + }, + { + "name": "novita/meta-llama/llama-3-8b-instruct", + "type": "chat", + "input_price_per_1m": 0.04, + "output_price_per_1m": 0.04, + "currency": "USD", + "context_window": 8192, + "size_b": 8, + "capabilities": [ + "tools" + ], + "hf_id": "meta-llama/Meta-Llama-3-8B-Instruct" + }, + { + "name": "novita/Sao10K/L3-8B-Stheno-v3.2", + "type": "chat", + "input_price_per_1m": 0.05, + "output_price_per_1m": 0.05, + "currency": "USD", + "context_window": 8192, + "size_b": 8 + }, + { + "name": "novita/meta-llama/llama-3.1-8b-instruct", + "type": "chat", + "input_price_per_1m": 0.05, + "output_price_per_1m": 0.05, + "currency": "USD", + "context_window": 16384, + "size_b": 8, + "capabilities": [ + "tools" + ], + "hf_id": "meta-llama/Meta-Llama-3.1-8B-Instruct" + }, + { + "name": "novita/sao10k/l3-8b-lunaris", + "type": "chat", + "input_price_per_1m": 0.05, + "output_price_per_1m": 0.05, + "currency": "USD", + "context_window": 8192, + "size_b": 8 + }, + { + "name": "openai-responses/gpt-5-nano", + "type": "vision", + "input_price_per_1m": 0.05, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "azure/gpt-5-nano", + "type": "vision", + "input_price_per_1m": 0.05, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "alibaba/qwen-turbo", + "type": "chat", + "input_price_per_1m": 0.05, + "output_price_per_1m": 0.2, + "currency": "USD", + "context_window": 1000000, + "capabilities": [ + "tools" + ] + }, + { + "name": "together/meta-llama/Llama-3.2-3B-Instruct-Turbo", + "type": "chat", + "input_price_per_1m": 0.06, + "output_price_per_1m": 0.06, + "currency": "USD", + "context_window": 131072, + "size_b": 3 + }, + { + "name": "deepinfra/microsoft/phi-4", + "type": "chat", + "input_price_per_1m": 0.07, + "output_price_per_1m": 0.14, + "currency": "USD", + "context_window": 16384 + }, + { + "name": "deepinfra/Qwen/Qwen2.5-Coder-32B-Instruct", + "type": "chat", + "input_price_per_1m": 0.07, + "output_price_per_1m": 0.16, + "currency": "USD", + "context_window": 16384, + "size_b": 32 + }, + { + "name": "novita/gryphe/mythomax-l2-13b", + "type": "chat", + "input_price_per_1m": 0.09, + "output_price_per_1m": 0.09, + "currency": "USD", + "context_window": 4096, + "size_b": 13 + }, + { + "name": "vertex/gemini-2.5-flash-lite", + "type": "vision", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "openai/gpt-4.1-nano", + "type": "vision", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "mistral/devstral-small-latest", + "type": "chat", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.3, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "mistralai/Devstral-Small-2507" + }, + { + "name": "mistral/mistral-small-2503", + "type": "chat", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.3, + "currency": "USD", + "context_window": 32768 + }, + { + "name": "mistral/devstral-small-2507", + "type": "chat", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.3, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "mistralai/Devstral-Small-2507" + }, + { + "name": "openai-responses/gpt-4.1-nano", + "type": "vision", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite", + "type": "chat", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.1, + "currency": "USD", + "context_window": 8192, + "size_b": 8 + }, + { + "name": "deepinfra/Qwen/Qwen3-32B", + "type": "chat", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.3, + "currency": "USD", + "context_window": 40000, + "size_b": 32, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "Qwen/Qwen3-32B" + }, + { + "name": "google/gemini-2.5-flash-lite", + "type": "vision", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "google/gemini-2.0-flash-001", + "type": "vision", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1048576 + }, + { + "name": "azure/openai-responses/gpt-4.1-nano", + "type": "vision", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "azure/gpt-4.1-nano", + "type": "vision", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "groq/openai/gpt-oss-20b", + "type": "chat", + "input_price_per_1m": 0.1, + "output_price_per_1m": 0.5, + "currency": "USD", + "context_window": 131072, + "size_b": 20, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "openai/gpt-oss-20b" + }, + { + "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo", + "type": "chat", + "input_price_per_1m": 0.12, + "output_price_per_1m": 0.3, + "currency": "USD", + "context_window": 131072, + "size_b": 70, + "capabilities": [ + "tools" + ], + "hf_id": "meta-llama/Llama-3.3-70B-Instruct" + }, + { + "name": "openai/gpt-5-mini", + "type": "vision", + "input_price_per_1m": 0.125, + "output_price_per_1m": 1, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "nebius/meta-llama/Llama-3.3-70B-Instruct", + "type": "chat", + "input_price_per_1m": 0.13, + "output_price_per_1m": 0.4, + "currency": "USD", + "context_window": 128000, + "size_b": 70, + "capabilities": [ + "tools" + ], + "hf_id": "meta-llama/Llama-3.3-70B-Instruct" + }, + { + "name": "novita/nousresearch/hermes-2-pro-llama-3-8b", + "type": "chat", + "input_price_per_1m": 0.14, + "output_price_per_1m": 0.14, + "currency": "USD", + "context_window": 8192, + "size_b": 8 + }, + { + "name": "novita/deepseek/deepseek-r1-distill-qwen-14b", + "type": "chat", + "input_price_per_1m": 0.15, + "output_price_per_1m": 0.15, + "currency": "USD", + "context_window": 128000, + "size_b": 14, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1" + }, + { + "name": "openai/gpt-4o-mini", + "type": "vision", + "input_price_per_1m": 0.15, + "output_price_per_1m": 0.6, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 128000 + }, + { + "name": "mistral/mistral-small-latest", + "type": "vision", + "input_price_per_1m": 0.15, + "output_price_per_1m": 0.6, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 256000 + }, + { + "name": "mistral/mistral-small-2603", + "type": "vision", + "input_price_per_1m": 0.15, + "output_price_per_1m": 0.6, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 256000, + "size_b": 119, + "hf_id": "mistralai/Mistral-Small-4-119B-2603" + }, + { + "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507", + "type": "chat", + "input_price_per_1m": 0.15, + "output_price_per_1m": 0.85, + "currency": "USD", + "context_window": 262144, + "size_b": 235 + }, + { + "name": "nebius/openai/gpt-oss-120b", + "type": "chat", + "input_price_per_1m": 0.15, + "output_price_per_1m": 0.6, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 131000, + "size_b": 120, + "hf_id": "openai/gpt-oss-120b" + }, + { + "name": "groq/openai/gpt-oss-120b", + "type": "chat", + "input_price_per_1m": 0.15, + "output_price_per_1m": 0.75, + "currency": "USD", + "context_window": 131072, + "size_b": 120, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "openai/gpt-oss-120b" + }, + { + "name": "novita/mistralai/mistral-nemo", + "type": "chat", + "input_price_per_1m": 0.17, + "output_price_per_1m": 0.17, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "mistralai/Mistral-Nemo-Instruct-2407" + }, + { + "name": "together/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo", + "type": "chat", + "input_price_per_1m": 0.18, + "output_price_per_1m": 0.18, + "currency": "USD", + "context_window": 131072, + "size_b": 8 + }, + { + "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.85, + "currency": "USD", + "context_window": 1048576, + "size_b": 17, + "capabilities": [ + "vision", + "tools" + ], + "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct" + }, + { + "name": "novita/qwen/qwen3-235b-a22b-fp8", + "type": "chat", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.8, + "currency": "USD", + "context_window": 128000, + "size_b": 235, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "Qwen/Qwen3-235B-A22B" + }, + { + "name": "openai/gpt-5.4-nano", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 1.25, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai-responses/gpt-5.4-nano", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 1.25, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "xai/grok-4-fast-non-reasoning", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.5, + "currency": "USD", + "context_window": 2000000, + "capabilities": [ + "vision", + "tools", + "reasoning" + ] + }, + { + "name": "xai/grok-4-1-fast-non-reasoning", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 2000000 + }, + { + "name": "xai/grok-code-fast-1", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 1.5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 256000 + }, + { + "name": "xai/grok-4-fast", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.5, + "currency": "USD", + "context_window": 2000000, + "capabilities": [ + "vision", + "tools", + "reasoning" + ] + }, + { + "name": "xai/grok-4-1-fast-reasoning", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 2000000 + }, + { + "name": "together/meta-llama/LlamaGuard-2-8b", + "type": "chat", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.2, + "currency": "USD", + "context_window": 8192, + "size_b": 8 + }, + { + "name": "deepinfra/zai-org/GLM-4.5-Air", + "type": "chat", + "input_price_per_1m": 0.2, + "output_price_per_1m": 1.1, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "zai-org/GLM-4.5-Air", + "size_b": 110.5 + }, + { + "name": "deepinfra/Qwen/Qwen3-235B-A22B", + "type": "chat", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.6, + "currency": "USD", + "context_window": 40000, + "size_b": 235, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "Qwen/Qwen3-235B-A22B" + }, + { + "name": "alibaba/qwen3-30b-a3b-instruct-2507", + "type": "vision", + "input_price_per_1m": 0.2, + "output_price_per_1m": 0.8, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 131072, + "size_b": 30, + "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507" + }, + { + "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "type": "chat", + "input_price_per_1m": 0.23, + "output_price_per_1m": 0.69, + "currency": "USD", + "context_window": 64000, + "size_b": 70, + "capabilities": [ + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B" + }, + { + "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct", + "type": "chat", + "input_price_per_1m": 0.23, + "output_price_per_1m": 0.4, + "currency": "USD", + "context_window": 130815, + "size_b": 70 + }, + { + "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct", + "type": "vision", + "input_price_per_1m": 0.23, + "output_price_per_1m": 0.4, + "currency": "USD", + "context_window": 131072, + "size_b": 72, + "capabilities": [ + "vision" + ], + "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct" + }, + { + "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct", + "type": "chat", + "input_price_per_1m": 0.23, + "output_price_per_1m": 0.4, + "currency": "USD", + "context_window": 131072, + "size_b": 70, + "capabilities": [ + "tools" + ], + "hf_id": "meta-llama/Llama-3.3-70B-Instruct" + }, + { + "name": "vertex/gemini-3.1-flash-lite-preview", + "type": "vision", + "input_price_per_1m": 0.25, + "output_price_per_1m": 1.5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1048576 + }, + { + "name": "mistral/open-mistral-7b", + "type": "chat", + "input_price_per_1m": 0.25, + "output_price_per_1m": 0.25, + "currency": "USD", + "context_window": 32768, + "size_b": 7 + }, + { + "name": "openai-responses/gpt-5-mini", + "type": "vision", + "input_price_per_1m": 0.25, + "output_price_per_1m": 2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "google/gemini-3.1-flash-lite-preview", + "type": "vision", + "input_price_per_1m": 0.25, + "output_price_per_1m": 1.5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1048576 + }, + { + "name": "azure/gpt-5-mini", + "type": "vision", + "input_price_per_1m": 0.25, + "output_price_per_1m": 2, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "novita/deepseek/deepseek-v3.2", + "type": "chat", + "input_price_per_1m": 0.269, + "output_price_per_1m": 0.4, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 163840, + "hf_id": "deepseek-ai/DeepSeek-V3.2" + }, + { + "name": "deepseek/deepseek-chat", + "type": "chat", + "input_price_per_1m": 0.28, + "output_price_per_1m": 0.42, + "currency": "USD", + "context_window": 128000, + "capabilities": [ + "tools" + ], + "hf_id": "deepseek-ai/DeepSeek-V3" + }, + { + "name": "deepseek/deepseek-reasoner", + "type": "chat", + "input_price_per_1m": 0.28, + "output_price_per_1m": 0.42, + "currency": "USD", + "context_window": 128000 + }, + { + "name": "novita/minimax-m2.7", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 1.2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000, + "hf_id": "MiniMaxAI/MiniMax-M2.7" + }, + { + "name": "novita/deepseek/deepseek-r1-distill-qwen-32b", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 0.3, + "currency": "USD", + "context_window": 12800, + "size_b": 32, + "capabilities": [ + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B" + }, + { + "name": "novita/MiniMax-M2.7", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 1.2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000, + "hf_id": "MiniMaxAI/MiniMax-M2.7" + }, + { + "name": "vertex/gemini-2.5-flash", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 2.5, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "vertex/gemini-2.5-flash-image", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 2.5, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "coding/gemini-2.5-flash", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 2.5, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "mistral/codestral-latest", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 0.9, + "currency": "USD", + "context_window": 131072 + }, + { + "name": "xai/grok-3-mini", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 0.5, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 131072 + }, + { + "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 0.3, + "currency": "USD", + "context_window": 32768, + "size_b": 7 + }, + { + "name": "deepinfra/deepseek-ai/DeepSeek-V3.1", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 1, + "currency": "USD", + "context_window": 163840, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus" + }, + { + "name": "parasail/parasail-gemma3-27b-it", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 0.5, + "currency": "USD", + "context_window": 128000, + "size_b": 27 + }, + { + "name": "google/gemini-2.5-flash", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 2.5, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "nebius/deepseek-ai/DeepSeek-V3.2", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 0.45, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 164000, + "hf_id": "deepseek-ai/DeepSeek-V3.2" + }, + { + "name": "nebius/minimax/minimax-m2.1", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 1.2, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000, + "hf_id": "MiniMaxAI/MiniMax-M2.1" + }, + { + "name": "minimaxi/MiniMax-M2.7", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 1.2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000, + "hf_id": "MiniMaxAI/MiniMax-M2.7" + }, + { + "name": "minimaxi/MiniMax-M2", + "type": "chat", + "input_price_per_1m": 0.3, + "output_price_per_1m": 1.2, + "currency": "USD", + "context_window": 200000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "MiniMaxAI/MiniMax-M2" + }, + { + "name": "minimaxi/MiniMax-M2.5", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 1.2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000, + "hf_id": "MiniMaxAI/MiniMax-M2.5" + }, + { + "name": "alibaba/qwen3-coder-flash", + "type": "vision", + "input_price_per_1m": 0.3, + "output_price_per_1m": 1.5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1048576 + }, + { + "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct", + "type": "chat", + "input_price_per_1m": 0.35, + "output_price_per_1m": 0.4, + "currency": "USD", + "context_window": 131072, + "size_b": 90 + }, + { + "name": "novita/qwen/qwen-2.5-72b-instruct", + "type": "chat", + "input_price_per_1m": 0.38, + "output_price_per_1m": 0.4, + "currency": "USD", + "context_window": 32000, + "size_b": 72, + "capabilities": [ + "tools" + ], + "hf_id": "Qwen/Qwen2.5-72B-Instruct" + }, + { + "name": "novita/meta-llama/llama-3.3-70b-instruct", + "type": "chat", + "input_price_per_1m": 0.39, + "output_price_per_1m": 0.39, + "currency": "USD", + "context_window": 131072, + "size_b": 70, + "capabilities": [ + "tools" + ], + "hf_id": "meta-llama/Llama-3.3-70B-Instruct" + }, + { + "name": "novita/deepseek/deepseek-v3-0324", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.3, + "currency": "USD", + "context_window": 128000, + "capabilities": [ + "tools", + "reasoning" + ], + "size_b": 685, + "hf_id": "deepseek-ai/DeepSeek-V3-0324" + }, + { + "name": "novita/deepseek/deepseek-v3-turbo", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.3, + "currency": "USD", + "context_window": 128000 + }, + { + "name": "openai/gpt-4.1-mini", + "type": "vision", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.6, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "mistral/devstral-latest", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 2, + "currency": "USD", + "context_window": 256000 + }, + { + "name": "mistral/devstral-medium-2507", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 2, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ] + }, + { + "name": "mistral/mistral-medium-latest", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 2, + "currency": "USD", + "context_window": 131072 + }, + { + "name": "openai-responses/gpt-4.1-mini", + "type": "vision", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.6, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.6, + "currency": "USD", + "context_window": 262144, + "size_b": 480, + "capabilities": [ + "tools" + ], + "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct" + }, + { + "name": "azure/gpt-4.1-mini", + "type": "vision", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.6, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "azure/openai-responses/gpt-4.1-mini", + "type": "vision", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.6, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "nebius/zai-org/GLM-4.7", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 2, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000, + "hf_id": "zai-org/GLM-4.7" + }, + { + "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.8, + "currency": "USD", + "context_window": 262000, + "size_b": 480, + "capabilities": [ + "tools" + ], + "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct" + }, + { + "name": "alibaba/qwen-plus", + "type": "chat", + "input_price_per_1m": 0.4, + "output_price_per_1m": 1.2, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ] + }, + { + "name": "vertex/gemini-3.1-flash-image-preview", + "type": "vision", + "input_price_per_1m": 0.5, + "output_price_per_1m": 2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 131072 + }, + { + "name": "vertex/gemini-3-flash-preview", + "type": "vision", + "input_price_per_1m": 0.5, + "output_price_per_1m": 3, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "mistral/mistral-large-latest", + "type": "chat", + "input_price_per_1m": 0.5, + "output_price_per_1m": 1.5, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ] + }, + { + "name": "google/gemini-3.1-flash-image-preview", + "type": "vision", + "input_price_per_1m": 0.5, + "output_price_per_1m": 2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 131072 + }, + { + "name": "google/gemini-3-flash-preview", + "type": "vision", + "input_price_per_1m": 0.5, + "output_price_per_1m": 3, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "nebius/moonshotai/Kimi-K2-Instruct", + "type": "chat", + "input_price_per_1m": 0.5, + "output_price_per_1m": 2.4, + "currency": "USD", + "context_window": 131000, + "capabilities": [ + "tools" + ], + "hf_id": "moonshotai/Kimi-K2-Instruct" + }, + { + "name": "nebius/deepseek-ai/DeepSeek-V3-0324", + "type": "chat", + "input_price_per_1m": 0.5, + "output_price_per_1m": 1.5, + "currency": "USD", + "context_window": 128000, + "capabilities": [ + "tools", + "reasoning" + ], + "size_b": 685, + "hf_id": "deepseek-ai/DeepSeek-V3-0324" + }, + { + "name": "nebius/moonshotai/kimi-k2.5", + "type": "vision", + "input_price_per_1m": 0.5, + "output_price_per_1m": 2.5, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 256000, + "hf_id": "moonshotai/Kimi-K2.5", + "size_b": 1058.6 + }, + { + "name": "novita/meta-llama/llama-3-70b-instruct", + "type": "chat", + "input_price_per_1m": 0.51, + "output_price_per_1m": 0.74, + "currency": "USD", + "context_window": 8192, + "size_b": 70, + "capabilities": [ + "tools" + ], + "hf_id": "meta-llama/Llama-3.3-70B-Instruct" + }, + { + "name": "openai/o4-mini", + "type": "vision", + "input_price_per_1m": 0.55, + "output_price_per_1m": 2.2, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "vertex/deepseek-v3.2", + "type": "vision", + "input_price_per_1m": 0.56, + "output_price_per_1m": 1.68, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 163840, + "hf_id": "deepseek-ai/DeepSeek-V3.2" + }, + { + "name": "novita/moonshotai/kimi-k2-instruct", + "type": "chat", + "input_price_per_1m": 0.57, + "output_price_per_1m": 2.3, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "moonshotai/Kimi-K2-Instruct" + }, + { + "name": "novita/zai-org/glm-4.6", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.2, + "currency": "USD", + "context_window": 204800, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "zai-org/GLM-4.6" + }, + { + "name": "novita/zai-org/glm-4.5", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.2, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "zai-org/GLM-4.5" + }, + { + "name": "zai/GLM-4.5", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.2, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 131072, + "hf_id": "zai-org/GLM-4.5" + }, + { + "name": "zai/GLM-4.6", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.2, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000, + "hf_id": "zai-org/GLM-4.6" + }, + { + "name": "zai/GLM-4.7", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.2, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000, + "hf_id": "zai-org/GLM-4.7" + }, + { + "name": "moonshot/kimi-k2-0711-preview", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.5, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "moonshotai/Kimi-K2-Instruct" + }, + { + "name": "moonshot/kimi-k2.5", + "type": "vision", + "input_price_per_1m": 0.6, + "output_price_per_1m": 3, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 262144, + "hf_id": "moonshotai/Kimi-K2.5", + "size_b": 1058.6 + }, + { + "name": "moonshot/kimi-k2-thinking-turbo", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.5, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "moonshotai/Kimi-K2-Thinking" + }, + { + "name": "moonshot/kimi-k2-0905-preview", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.5, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "moonshotai/Kimi-K2-Instruct-0905" + }, + { + "name": "moonshot/kimi-k2-thinking", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.5, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "moonshotai/Kimi-K2-Instruct" + }, + { + "name": "deepinfra/zai-org/GLM-4.5", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.2, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "zai-org/GLM-4.5" + }, + { + "name": "nebius/zai-org/GLM-4.5", + "type": "chat", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.2, + "currency": "USD", + "context_window": 128000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "zai-org/GLM-4.5" + }, + { + "name": "minimaxi/MiniMax-M2.7-highspeed", + "type": "vision", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.4, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000, + "hf_id": "MiniMaxAI/MiniMax-M2.7" + }, + { + "name": "minimaxi/MiniMax-M2.5-highspeed", + "type": "vision", + "input_price_per_1m": 0.6, + "output_price_per_1m": 2.4, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000, + "hf_id": "MiniMaxAI/MiniMax-M2.5" + }, + { + "name": "alibaba/qwen3.5", + "type": "vision", + "input_price_per_1m": 0.6, + "output_price_per_1m": 3.6, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 256000, + "size_b": 9, + "hf_id": "Qwen/Qwen3.5-9B" + }, + { + "name": "novita/microsoft/wizardlm-2-8x22b", + "type": "chat", + "input_price_per_1m": 0.62, + "output_price_per_1m": 0.62, + "currency": "USD", + "context_window": 65535, + "size_b": 22 + }, + { + "name": "openai/gpt-5", + "type": "vision", + "input_price_per_1m": 0.625, + "output_price_per_1m": 5, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "novita/deepseek/deepseek-prover-v2-671b", + "type": "chat", + "input_price_per_1m": 0.7, + "output_price_per_1m": 2.5, + "currency": "USD", + "context_window": 160000, + "size_b": 671 + }, + { + "name": "novita/deepseek/deepseek-r1-turbo", + "type": "chat", + "input_price_per_1m": 0.7, + "output_price_per_1m": 2.5, + "currency": "USD", + "context_window": 64000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1" + }, + { + "name": "parasail/parasail-qwen25-vl-72b-instruct", + "type": "vision", + "input_price_per_1m": 0.7, + "output_price_per_1m": 0.7, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 32768, + "size_b": 72 + }, + { + "name": "openai/gpt-5.4-mini", + "type": "vision", + "input_price_per_1m": 0.75, + "output_price_per_1m": 4.5, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai-responses/gpt-5.4-mini", + "type": "vision", + "input_price_per_1m": 0.75, + "output_price_per_1m": 4.5, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "novita/deepseek/deepseek-r1-distill-llama-70b", + "type": "chat", + "input_price_per_1m": 0.8, + "output_price_per_1m": 0.8, + "currency": "USD", + "context_window": 32000, + "size_b": 70, + "capabilities": [ + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B" + }, + { + "name": "novita/qwen/qwen2.5-vl-72b-instruct", + "type": "vision", + "input_price_per_1m": 0.8, + "output_price_per_1m": 0.8, + "currency": "USD", + "context_window": 96000, + "size_b": 72, + "capabilities": [ + "vision" + ], + "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct" + }, + { + "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct", + "type": "chat", + "input_price_per_1m": 0.8, + "output_price_per_1m": 0.8, + "currency": "USD", + "context_window": 130815, + "size_b": 405 + }, + { + "name": "nebius/deepseek-ai/DeepSeek-R1-0528", + "type": "chat", + "input_price_per_1m": 0.8, + "output_price_per_1m": 2.4, + "currency": "USD", + "context_window": 164000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1-0528" + }, + { + "name": "deepinfra/deepseek-ai/DeepSeek-R1", + "type": "chat", + "input_price_per_1m": 0.85, + "output_price_per_1m": 2.5, + "currency": "USD", + "context_window": 64000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1" + }, + { + "name": "deepinfra/deepseek-ai/DeepSeek-V3", + "type": "chat", + "input_price_per_1m": 0.85, + "output_price_per_1m": 0.9, + "currency": "USD", + "context_window": 128000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus" + }, + { + "name": "alibaba/qwen3-max", + "type": "vision", + "input_price_per_1m": 0.861, + "output_price_per_1m": 3.441, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 262144 + }, + { + "name": "together/meta-llama/Llama-3.3-70B-Instruct-Turbo", + "type": "chat", + "input_price_per_1m": 0.88, + "output_price_per_1m": 0.88, + "currency": "USD", + "context_window": 131072, + "size_b": 70, + "capabilities": [ + "tools" + ], + "hf_id": "meta-llama/Llama-3.3-70B-Instruct" + }, + { + "name": "together/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo", + "type": "chat", + "input_price_per_1m": 0.88, + "output_price_per_1m": 0.88, + "currency": "USD", + "context_window": 131072, + "size_b": 70 + }, + { + "name": "novita/deepseek/deepseek_v3", + "type": "chat", + "input_price_per_1m": 0.89, + "output_price_per_1m": 0.89, + "currency": "USD", + "context_window": 64000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus" + }, + { + "name": "parasail/parasail-kimi-k2-instruct", + "type": "chat", + "input_price_per_1m": 0.99, + "output_price_per_1m": 2.99, + "currency": "USD", + "context_window": 131072 + }, + { + "name": "perplexity/sonar", + "type": "vision", + "input_price_per_1m": 1, + "output_price_per_1m": 1, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "vision" + ] + }, + { + "name": "bedrock/claude-haiku-4-5", + "type": "vision", + "input_price_per_1m": 1, + "output_price_per_1m": 5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 200000 + }, + { + "name": "novita/GLM-5", + "type": "chat", + "input_price_per_1m": 1, + "output_price_per_1m": 3.2, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 202800, + "hf_id": "zai-org/GLM-5" + }, + { + "name": "vertex/claude-haiku-4-5", + "type": "vision", + "input_price_per_1m": 1, + "output_price_per_1m": 5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 200000 + }, + { + "name": "openai/o3", + "type": "vision", + "input_price_per_1m": 1, + "output_price_per_1m": 4, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "zai/GLM-5", + "type": "vision", + "input_price_per_1m": 1, + "output_price_per_1m": 3.2, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000, + "hf_id": "zai-org/GLM-5" + }, + { + "name": "anthropic/claude-haiku-4-5", + "type": "vision", + "input_price_per_1m": 1, + "output_price_per_1m": 5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 200000 + }, + { + "name": "alibaba/qwen3-coder-plus", + "type": "vision", + "input_price_per_1m": 1, + "output_price_per_1m": 5, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1048576 + }, + { + "name": "groq/moonshotai/Kimi-K2-Instruct-0905", + "type": "chat", + "input_price_per_1m": 1, + "output_price_per_1m": 3, + "currency": "USD", + "context_window": 256000, + "capabilities": [ + "tools" + ], + "hf_id": "moonshotai/Kimi-K2-Instruct" + }, + { + "name": "groq/moonshotai/kimi-k2-instruct", + "type": "chat", + "input_price_per_1m": 1, + "output_price_per_1m": 3, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "moonshotai/Kimi-K2-Instruct" + }, + { + "name": "openai/o3-mini", + "type": "chat", + "input_price_per_1m": 1.1, + "output_price_per_1m": 4.4, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "openai-responses/o4-mini", + "type": "vision", + "input_price_per_1m": 1.1, + "output_price_per_1m": 4.4, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "openai-responses/o3-mini", + "type": "chat", + "input_price_per_1m": 1.1, + "output_price_per_1m": 4.4, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "azure/o4-mini", + "type": "vision", + "input_price_per_1m": 1.1, + "output_price_per_1m": 4.4, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "moonshot/kimi-k2-turbo-preview", + "type": "chat", + "input_price_per_1m": 1.2, + "output_price_per_1m": 5, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ], + "hf_id": "moonshotai/Kimi-K2-Instruct" + }, + { + "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo", + "type": "chat", + "input_price_per_1m": 1.2, + "output_price_per_1m": 1.2, + "currency": "USD", + "context_window": 32768, + "size_b": 72 + }, + { + "name": "vertex/gemini-2.5-pro", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "openai/gpt-5-chat", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 128000 + }, + { + "name": "openai/gpt-5.1", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai/gpt-5.1-chat", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 128000 + }, + { + "name": "coding/gemini-2.5-pro", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "openai-responses/gpt-5", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai-responses/gpt-5.1", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai-responses/gpt-5.1-codex", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai-responses/gpt-5-codex", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "together/deepseek-ai/DeepSeek-V3", + "type": "chat", + "input_price_per_1m": 1.25, + "output_price_per_1m": 1.25, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus" + }, + { + "name": "google/gemini-2.5-pro", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "azure/gpt-5", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "azure/gpt-5.1", + "type": "vision", + "input_price_per_1m": 1.25, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "novita/sao10k/l31-70b-euryale-v2.2", + "type": "chat", + "input_price_per_1m": 1.48, + "output_price_per_1m": 1.48, + "currency": "USD", + "context_window": 16000, + "size_b": 70 + }, + { + "name": "novita/sao10k/l3-70b-euryale-v2.1", + "type": "chat", + "input_price_per_1m": 1.48, + "output_price_per_1m": 1.48, + "currency": "USD", + "context_window": 16000, + "size_b": 70 + }, + { + "name": "alibaba/qwen-max", + "type": "chat", + "input_price_per_1m": 1.6, + "output_price_per_1m": 6.4, + "currency": "USD", + "context_window": 32768, + "capabilities": [ + "tools" + ] + }, + { + "name": "openai/gpt-5.3-chat", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 128000 + }, + { + "name": "openai/gpt-5.2", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai/gpt-5.2-chat", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 128000 + }, + { + "name": "openai-responses/gpt-5.2-codex", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai-responses/gpt-5.3-codex", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "openai-responses/gpt-5.3-chat", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 128000 + }, + { + "name": "openai-responses/gpt-5.2", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "azure/gpt-5.3-codex", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "azure/openai-responses/gpt-5.2-codex", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 400000 + }, + { + "name": "azure/gpt-5.2", + "type": "vision", + "input_price_per_1m": 1.75, + "output_price_per_1m": 14, + "currency": "USD", + "capabilities": [ + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "perplexity/sonar-reasoning-pro", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 8, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "vision", + "reasoning" + ] + }, + { + "name": "vertex/gemini-3.1-pro-preview", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 12, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "vertex/gemini-3-pro-preview", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 12, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "vertex/gemini-3-pro-image-preview", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 12, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "openai/gpt-4.1", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 8, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "openai/o4-mini-deep-research", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 8, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 100000 + }, + { + "name": "mistral/pixtral-large-latest", + "type": "chat", + "input_price_per_1m": 2, + "output_price_per_1m": 5, + "currency": "USD", + "context_window": 131072 + }, + { + "name": "openai-responses/gpt-4.1", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 8, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "xai/grok-2-1212", + "type": "chat", + "input_price_per_1m": 2, + "output_price_per_1m": 10, + "currency": "USD", + "context_window": 131072 + }, + { + "name": "xai/grok-4.2-beta", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 6, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 2000000 + }, + { + "name": "google/gemini-3-pro-preview", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 12, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "google/gemini-3.1-pro-preview", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 12, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1048576 + }, + { + "name": "azure/openai-responses/gpt-4.1", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 8, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "azure/gpt-4.1", + "type": "vision", + "input_price_per_1m": 2, + "output_price_per_1m": 8, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 1047576 + }, + { + "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast", + "type": "chat", + "input_price_per_1m": 2, + "output_price_per_1m": 6, + "currency": "USD", + "context_window": 128000 + }, + { + "name": "openai/gpt-4o-2024-11-20", + "type": "vision", + "input_price_per_1m": 2.5, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 128000 + }, + { + "name": "openai/gpt-4o-2024-08-06", + "type": "vision", + "input_price_per_1m": 2.5, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 128000 + }, + { + "name": "openai/gpt-4o-2024-05-13", + "type": "vision", + "input_price_per_1m": 2.5, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 128000 + }, + { + "name": "openai/gpt-5.4", + "type": "vision", + "input_price_per_1m": 2.5, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1050000 + }, + { + "name": "openai/gpt-4o", + "type": "vision", + "input_price_per_1m": 2.5, + "output_price_per_1m": 10, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 128000 + }, + { + "name": "openai-responses/gpt-5.4", + "type": "vision", + "input_price_per_1m": 2.5, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1050000 + }, + { + "name": "azure/openai-responses/gpt-5.4", + "type": "vision", + "input_price_per_1m": 2.5, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1050000 + }, + { + "name": "perplexity/sonar-pro", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "context_window": 204800, + "capabilities": [ + "vision" + ] + }, + { + "name": "bedrock/claude-sonnet-4-5", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "bedrock/claude-sonnet-4-6", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1000000 + }, + { + "name": "bedrock/claude-sonnet-4", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "bedrock/claude-3-7-sonnet", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "vertex/claude-sonnet-4-5", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "vertex/claude-sonnet-4", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "vertex/claude-3-7-sonnet", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "vertex/claude-3-5-sonnet", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 200000 + }, + { + "name": "coding/claude-sonnet-4-20250514", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "anthropic/claude-sonnet-4-5", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1000000 + }, + { + "name": "anthropic/claude-sonnet-4-6", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1000000 + }, + { + "name": "anthropic/claude-sonnet-4", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1000000 + }, + { + "name": "xai/grok-4", + "type": "vision", + "input_price_per_1m": 3, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 256000 + }, + { + "name": "together/deepseek-ai/DeepSeek-R1", + "type": "chat", + "input_price_per_1m": 3, + "output_price_per_1m": 7, + "currency": "USD", + "context_window": 64000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1" + }, + { + "name": "novita/deepseek/deepseek-r1", + "type": "chat", + "input_price_per_1m": 4, + "output_price_per_1m": 4, + "currency": "USD", + "context_window": 64000, + "capabilities": [ + "tools", + "reasoning" + ], + "hf_id": "deepseek-ai/DeepSeek-R1" + }, + { + "name": "bedrock/claude-opus-4-5", + "type": "vision", + "input_price_per_1m": 5, + "output_price_per_1m": 25, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "bedrock/claude-opus-4-6", + "type": "vision", + "input_price_per_1m": 5, + "output_price_per_1m": 25, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1000000 + }, + { + "name": "vertex/claude-opus-4-6", + "type": "vision", + "input_price_per_1m": 5, + "output_price_per_1m": 25, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1000000 + }, + { + "name": "vertex/claude-opus-4-5", + "type": "vision", + "input_price_per_1m": 5, + "output_price_per_1m": 25, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "openai/chatgpt-4o", + "type": "vision", + "input_price_per_1m": 5, + "output_price_per_1m": 15, + "currency": "USD", + "capabilities": [ + "vision" + ], + "context_window": 128000 + }, + { + "name": "anthropic/claude-opus-4-6", + "type": "vision", + "input_price_per_1m": 5, + "output_price_per_1m": 25, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 1000000 + }, + { + "name": "anthropic/claude-opus-4-5", + "type": "vision", + "input_price_per_1m": 5, + "output_price_per_1m": 25, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "xai/grok-3", + "type": "chat", + "input_price_per_1m": 5, + "output_price_per_1m": 25, + "currency": "USD", + "context_window": 131072, + "capabilities": [ + "tools" + ] + }, + { + "name": "openai/o3-deep-research", + "type": "vision", + "input_price_per_1m": 10, + "output_price_per_1m": 40, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 100000 + }, + { + "name": "bedrock/claude-opus-4", + "type": "vision", + "input_price_per_1m": 15, + "output_price_per_1m": 75, + "currency": "USD", + "capabilities": [ + "vision", + "reasoning" + ], + "context_window": 200000 + }, + { + "name": "vertex/claude-opus-4", "type": "vision", - "input_price_per_1m": 0.23, - "output_price_per_1m": 1.86, - "currency": "EUR", - "provider_upstream": "OpenAI", + "input_price_per_1m": 15, + "output_price_per_1m": 75, + "currency": "USD", "capabilities": [ "vision", - "files", - "tools", - "reasoning", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 200000 }, { - "name": "GPT-5", + "name": "vertex/claude-opus-4-1", "type": "vision", - "input_price_per_1m": 1.16, - "output_price_per_1m": 9.32, - "currency": "EUR", - "provider_upstream": "OpenAI", + "input_price_per_1m": 15, + "output_price_per_1m": 75, + "currency": "USD", "capabilities": [ "vision", - "files", - "tools", - "reasoning", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 200000 }, { - "name": "GPT-4o Mini", + "name": "openai/o1", "type": "vision", - "input_price_per_1m": 0.14, - "output_price_per_1m": 0.56, - "currency": "EUR", - "provider_upstream": "OpenAI", + "input_price_per_1m": 15, + "output_price_per_1m": 60, + "currency": "USD", "capabilities": [ "vision", - "files", - "tools", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 200000 }, { - "name": "GPT-4.1 nano", + "name": "coding/claude-opus-4-20250514", "type": "vision", - "input_price_per_1m": 0.09, - "output_price_per_1m": 0.37, - "currency": "EUR", - "provider_upstream": "OpenAI", + "input_price_per_1m": 15, + "output_price_per_1m": 75, + "currency": "USD", "capabilities": [ "vision", - "files", - "tools", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 200000 }, { - "name": "GPT-4o", + "name": "anthropic/claude-opus-4-1", "type": "vision", - "input_price_per_1m": 2.56, - "output_price_per_1m": 10.25, - "currency": "EUR", - "provider_upstream": "OpenAI", + "input_price_per_1m": 15, + "output_price_per_1m": 75, + "currency": "USD", "capabilities": [ "vision", - "files", - "tools", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 200000 }, { - "name": "GPT-4.1", + "name": "anthropic/claude-opus-4", "type": "vision", - "input_price_per_1m": 1.86, - "output_price_per_1m": 7.45, - "currency": "EUR", - "provider_upstream": "OpenAI", + "input_price_per_1m": 15, + "output_price_per_1m": 75, + "currency": "USD", "capabilities": [ "vision", - "files", - "tools", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 200000 }, { - "name": "GPT-4.1 mini", + "name": "openai-responses/gpt-5-pro", "type": "vision", - "input_price_per_1m": 0.37, - "output_price_per_1m": 1.49, - "currency": "EUR", - "provider_upstream": "OpenAI", + "input_price_per_1m": 15, + "output_price_per_1m": 120, + "currency": "USD", "capabilities": [ "vision", - "files", - "tools", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 400000 }, { - "name": "Gemini 3 Flash Preview", + "name": "openai-responses/o3-pro", "type": "vision", - "input_price_per_1m": 0.47, - "output_price_per_1m": 2.8, - "currency": "EUR", - "provider_upstream": "Google", + "input_price_per_1m": 20, + "output_price_per_1m": 80, + "currency": "USD", "capabilities": [ "vision", - "video", - "audio", - "files", - "tools", - "reasoning", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 200000 }, { - "name": "GPT oss (120b)", - "type": "chat", - "input_price_per_1m": 0.28, - "output_price_per_1m": 2.33, - "currency": "EUR", - "size_b": 120, - "provider_upstream": "OpenAI", + "name": "openai/gpt-5.4-pro", + "type": "vision", + "input_price_per_1m": 30, + "output_price_per_1m": 180, + "currency": "USD", "capabilities": [ - "tools", - "reasoning", - "eu-endpoint" + "vision", + "reasoning" ], - "hf_id": "openai/gpt-oss-120b" + "context_window": 1050000 }, { - "name": "Gemini 2.5 Flash", + "name": "openai-responses/gpt-5.4-pro", "type": "vision", - "input_price_per_1m": 0.28, - "output_price_per_1m": 2.33, - "currency": "EUR", - "provider_upstream": "Google", + "input_price_per_1m": 30, + "output_price_per_1m": 180, + "currency": "USD", "capabilities": [ "vision", - "video", - "audio", - "files", - "tools", - "reasoning", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 1050000 }, { - "name": "Gemini 2.5 Pro Reasoning", + "name": "azure/openai-responses/gpt-5.4-pro", "type": "vision", - "input_price_per_1m": 2.33, - "output_price_per_1m": 13.98, - "currency": "EUR", - "provider_upstream": "Google", + "input_price_per_1m": 30, + "output_price_per_1m": 180, + "currency": "USD", "capabilities": [ "vision", - "video", - "audio", - "files", - "tools", - "reasoning", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 1050000 }, { - "name": "Gemini 2.5 Pro", + "name": "openai/o1-pro", "type": "vision", - "input_price_per_1m": 2.33, - "output_price_per_1m": 13.98, - "currency": "EUR", - "provider_upstream": "Google", + "input_price_per_1m": 150, + "output_price_per_1m": 600, + "currency": "USD", "capabilities": [ "vision", - "video", - "audio", - "files", - "tools", - "reasoning", - "eu-endpoint" - ] + "reasoning" + ], + "context_window": 200000 } - ] - }, - { - "name": "Requesty", - "url": "https://requesty.ai", - "headquarters": "USA", - "region": "Global", - "gdpr_compliant": true, - "eu_endpoints": true, - "models": [], + ], "lastUpdated": "2026-03-02T04:53:24.807Z" }, { @@ -1042,8 +3869,7 @@ "flavor": "base", "capabilities": [ "tools", - "reasoning", - "eu-endpoint" + "reasoning" ], "hf_id": "openai/gpt-oss-120b" }, @@ -1057,8 +3883,7 @@ "flavor": "base", "capabilities": [ "tools", - "reasoning", - "eu-endpoint" + "reasoning" ], "hf_id": "openai/gpt-oss-20b" }, @@ -1072,8 +3897,7 @@ "capabilities": [ "tools" ], - "hf_id": "moonshotai/Kimi-K2-Instruct", - "size_b": 1026.5 + "hf_id": "moonshotai/Kimi-K2-Instruct" }, { "name": "Qwen3-Coder-480B-A35B-Instruct (base)", @@ -1084,8 +3908,7 @@ "size_b": 480, "flavor": "base", "capabilities": [ - "tools", - "eu-endpoint" + "tools" ], "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct" }, @@ -1153,8 +3976,7 @@ "size_b": 30, "flavor": "base", "capabilities": [ - "tools", - "eu-endpoint" + "tools" ], "hf_id": "Qwen/Qwen3-Coder-30B-A3B-Instruct" }, @@ -1271,8 +4093,7 @@ "tools", "reasoning" ], - "hf_id": "zai-org/GLM-4.5", - "size_b": 358.3 + "hf_id": "zai-org/GLM-4.5" }, { "name": "GLM-4.5-Air (base)", @@ -1299,8 +4120,7 @@ "tools", "reasoning" ], - "hf_id": "deepseek-ai/DeepSeek-R1-0528", - "size_b": 684.5 + "hf_id": "deepseek-ai/DeepSeek-R1-0528" }, { "name": "DeepSeek-R1-0528 (base)", @@ -1313,8 +4133,7 @@ "tools", "reasoning" ], - "hf_id": "deepseek-ai/DeepSeek-R1-0528", - "size_b": 684.5 + "hf_id": "deepseek-ai/DeepSeek-R1-0528" }, { "name": "DeepSeek-V3-0324 (fast)", @@ -1349,8 +4168,7 @@ "size_b": 70, "flavor": "fast", "capabilities": [ - "tools", - "eu-endpoint" + "tools" ], "hf_id": "meta-llama/Llama-3.3-70B-Instruct" }, @@ -1363,8 +4181,7 @@ "size_b": 70, "flavor": "base", "capabilities": [ - "tools", - "eu-endpoint" + "tools" ], "hf_id": "meta-llama/Llama-3.3-70B-Instruct" }, @@ -1645,8 +4462,7 @@ "size_b": 120, "capabilities": [ "tools", - "reasoning", - "eu-endpoint" + "reasoning" ], "hf_id": "openai/gpt-oss-120b" }, @@ -1694,8 +4510,7 @@ "currency": "EUR", "size_b": 70, "capabilities": [ - "tools", - "eu-endpoint" + "tools" ], "hf_id": "meta-llama/Llama-3.3-70B-Instruct" }, @@ -1720,8 +4535,7 @@ "currency": "EUR", "size_b": 30, "capabilities": [ - "tools", - "eu-endpoint" + "tools" ], "hf_id": "Qwen/Qwen3-Coder-30B-A3B-Instruct" }, @@ -2136,8 +4950,7 @@ "input_price_per_1m": 0.017, "output_price_per_1m": 0.11, "currency": "USD", - "hf_id": "ibm-granite/granite-4.0-h-micro", - "size_b": 3.2 + "hf_id": "ibm-granite/granite-4.0-h-micro" }, { "name": "google/gemma-3n-e4b-it", @@ -2464,8 +5277,7 @@ "capabilities": [ "tools", "reasoning" - ], - "size_b": 31.2 + ] }, { "name": "qwen/qwen3-14b", @@ -2715,8 +5527,7 @@ "capabilities": [ "tools", "reasoning" - ], - "size_b": 309.8 + ] }, { "name": "alibaba/tongyi-deepresearch-30b-a3b", @@ -2806,8 +5617,7 @@ "capabilities": [ "tools", "reasoning" - ], - "size_b": 199.4 + ] }, { "name": "mistralai/mistral-small-creative", @@ -3031,8 +5841,7 @@ "hf_id": "Qwen/Qwen3-Coder-Next", "capabilities": [ "tools" - ], - "size_b": 79.7 + ] }, { "name": "allenai/olmo-3-7b-think", @@ -4261,8 +7070,7 @@ "capabilities": [ "tools", "reasoning" - ], - "size_b": 684.5 + ] }, { "name": "undi95/remm-slerp-l2-13b", @@ -4453,8 +7261,7 @@ "capabilities": [ "tools", "reasoning" - ], - "size_b": 358.3 + ] }, { "name": "nvidia/llama-3.1-nemotron-ultra-253b-v1", @@ -5926,8 +8733,7 @@ "capabilities": [ "tools", "reasoning" - ], - "size_b": 199.4 + ] }, { "name": "arcee-ai/trinity-large-preview:free", @@ -6189,8 +8995,7 @@ "size_b": 20, "capabilities": [ "tools", - "reasoning", - "eu-endpoint" + "reasoning" ], "hf_id": "openai/gpt-oss-20b" }, @@ -6216,8 +9021,7 @@ "size_b": 120, "capabilities": [ "tools", - "reasoning", - "eu-endpoint" + "reasoning" ], "hf_id": "openai/gpt-oss-120b" }, @@ -6241,8 +9045,7 @@ "size_b": 17, "capabilities": [ "vision", - "tools", - "eu-endpoint" + "tools" ], "hf_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct" },