---
# LiteLLM proxy configuration.
# NOTE(review): recovered from a table-formatted paste in which indentation was
# lost; the nesting below follows the documented LiteLLM config layout --
# confirm against the deployed copy.
model_list:
# OpenAI-style models sent to a custom api_base. Each upstream model is exposed
# twice: under a "-northflank" suffixed name and under the plain model name.
- model_name: gpt-4o-mini-northflank
  litellm_params:
    model: openai/gpt-4o-mini
    api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
    api_key: os.environ/NF_API_KEY
- model_name: gpt-4o-mini
  litellm_params:
    model: openai/gpt-4o-mini
    api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
    api_key: os.environ/NF_API_KEY
- model_name: gpt-3.5-turbo-northflank
  litellm_params:
    model: openai/gpt-3.5-turbo
    api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
    api_key: os.environ/NF_API_KEY
- model_name: gpt-3.5-turbo
  litellm_params:
    model: openai/gpt-3.5-turbo
    api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
    api_key: os.environ/NF_API_KEY
# Gemini 1.5 Pro using GEMINI_API_KEY1: one key-specific name ("-k1") plus one
# deployment registered under the shared "gemini-1.5-pro" name.
- model_name: gemini-1.5-pro-k1
  litellm_params:
    model: gemini/gemini-1.5-pro
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-1.5-pro
  litellm_params:
    model: gemini/gemini-1.5-pro
    api_key: os.environ/GEMINI_API_KEY1
    # Rate limits for this deployment, placed under litellm_params as in the
    # LiteLLM load-balancing docs.
    # NOTE(review): original nesting was lost -- confirm placement.
    rpm: 4
    tpm: 6400
# Gemini 1.5 Flash using GEMINI_API_KEY1: one key-specific name ("-k1") plus
# one deployment registered under the shared "gemini-1.5-flash" name.
- model_name: gemini-1.5-flash-k1
  litellm_params:
    model: gemini/gemini-1.5-flash
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-1.5-flash
  litellm_params:
    model: gemini/gemini-1.5-flash
    api_key: os.environ/GEMINI_API_KEY1
    # Rate limits for this deployment, placed under litellm_params as in the
    # LiteLLM load-balancing docs.
    # NOTE(review): original nesting was lost -- confirm placement.
    rpm: 30
    tpm: 2000000
# Gemini 1.5 Pro using GEMINI_API_KEY2: one key-specific name ("-k2") plus a
# second deployment registered under the shared "gemini-1.5-pro" name.
- model_name: gemini-1.5-pro-k2
  litellm_params:
    model: gemini/gemini-1.5-pro
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-1.5-pro
  litellm_params:
    model: gemini/gemini-1.5-pro
    # Was os.environ/GEMINI_API_KEY (no suffix); every other key-2 entry reads
    # GEMINI_API_KEY2, so this deployment now uses the same variable.
    # NOTE(review): revert if an unsuffixed GEMINI_API_KEY is really intended.
    api_key: os.environ/GEMINI_API_KEY2
    # Rate limits for this deployment, placed under litellm_params as in the
    # LiteLLM load-balancing docs.
    # NOTE(review): original nesting was lost -- confirm placement.
    rpm: 4
    tpm: 6400
# Gemini 1.5 Flash using GEMINI_API_KEY2: one key-specific name ("-k2") plus a
# second deployment registered under the shared "gemini-1.5-flash" name.
- model_name: gemini-1.5-flash-k2
  litellm_params:
    model: gemini/gemini-1.5-flash
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-1.5-flash
  litellm_params:
    model: gemini/gemini-1.5-flash
    api_key: os.environ/GEMINI_API_KEY2
    # Rate limits for this deployment, placed under litellm_params as in the
    # LiteLLM load-balancing docs.
    # NOTE(review): original nesting was lost -- confirm placement.
    rpm: 30
    tpm: 2000000
# Library-level LiteLLM settings: timeout, retries, fallbacks and cooldown.
litellm_settings:
  request_timeout: 20
  num_retries: 3
  # When a "gemini-1.5-pro" call fails, retry it on "gemini-1.5-flash".
  fallbacks:
  - gemini-1.5-pro: [gemini-1.5-flash]
  allowed_fails: 3
  cooldown_time: 30
  drop_params: true
# Proxy-level settings.
general_settings:
  # The master key is referenced through the MASTER_KEY environment variable
  # instead of being written into this file.
  master_key: os.environ/MASTER_KEY
# Router settings: fallbacks, model-group aliases and load-balancing strategy.
router_settings:
  # NOTE(review): fallbacks given here are passed straight to the Router and
  # appear to take precedence over litellm_settings.fallbacks. The
  # gemini-1.5-pro entry is therefore repeated here so it stays effective --
  # confirm against the LiteLLM version in use.
  fallbacks:
  - gpt-4o-mini: [gemini-1.5-flash]
  - gpt-3.5-turbo: [gemini-1.5-flash]
  - gemini-1.5-pro: [gemini-1.5-flash]
  # Requests for "gpt-4" are served by the "gemini-1.5-pro" model group.
  model_group_alias:
    gpt-4: gemini-1.5-pro
  routing_strategy: simple-shuffle