Spaces:
Sleeping
Sleeping
add more fallback models
Browse files
app.py
CHANGED
|
@@ -55,7 +55,6 @@ class BasicAgent:
|
|
| 55 |
"rpm": 5,
|
| 56 |
"tpm": 250_000,
|
| 57 |
},
|
| 58 |
-
"fallbacks": ["gemini/gemini-2.5-flash"],
|
| 59 |
},
|
| 60 |
{
|
| 61 |
"model_name": "gemini-family",
|
|
@@ -64,7 +63,6 @@ class BasicAgent:
|
|
| 64 |
"rpm": 10,
|
| 65 |
"tpm": 250_000,
|
| 66 |
},
|
| 67 |
-
"fallbacks": ["gemini/gemini-2.0-flash"]
|
| 68 |
},
|
| 69 |
{
|
| 70 |
"model_name": "gemini-family",
|
|
@@ -73,7 +71,6 @@ class BasicAgent:
|
|
| 73 |
"rpm": 15,
|
| 74 |
"tpm": 1_000_000,
|
| 75 |
},
|
| 76 |
-
"fallbacks": ["gemini/gemini-2.0-flash-lite"]
|
| 77 |
},
|
| 78 |
{
|
| 79 |
"model_name": "gemini-family",
|
|
@@ -83,11 +80,25 @@ class BasicAgent:
|
|
| 83 |
"tpm": 1_000_000,
|
| 84 |
},
|
| 85 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 86 |
],
|
| 87 |
client_kwargs={
|
| 88 |
"routing_strategy": "usage-based-routing-v2"
|
| 89 |
},
|
| 90 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 91 |
api_key=os.getenv("API_KEY"),
|
| 92 |
)
|
| 93 |
self.agent = CodeAgent(
|
|
|
|
| 55 |
"rpm": 5,
|
| 56 |
"tpm": 250_000,
|
| 57 |
},
|
|
|
|
| 58 |
},
|
| 59 |
{
|
| 60 |
"model_name": "gemini-family",
|
|
|
|
| 63 |
"rpm": 10,
|
| 64 |
"tpm": 250_000,
|
| 65 |
},
|
|
|
|
| 66 |
},
|
| 67 |
{
|
| 68 |
"model_name": "gemini-family",
|
|
|
|
| 71 |
"rpm": 15,
|
| 72 |
"tpm": 1_000_000,
|
| 73 |
},
|
|
|
|
| 74 |
},
|
| 75 |
{
|
| 76 |
"model_name": "gemini-family",
|
|
|
|
| 80 |
"tpm": 1_000_000,
|
| 81 |
},
|
| 82 |
},
|
| 83 |
+
{
|
| 84 |
+
"model_name": "gemini-family",
|
| 85 |
+
"litellm_params": {
|
| 86 |
+
"model": "gemini/gemini-2.5-flash-lite-preview-06-17",
|
| 87 |
+
"rpm": 15,
|
| 88 |
+
"tpm": 250_000,
|
| 89 |
+
},
|
| 90 |
+
},
|
| 91 |
],
|
| 92 |
client_kwargs={
|
| 93 |
"routing_strategy": "usage-based-routing-v2"
|
| 94 |
},
|
| 95 |
+
fallbacks=[
|
| 96 |
+
{"gemini-2.5-pro": "gemini-2.5-flash"},
|
| 97 |
+
{"gemini-2.5-flash": ["gemini-2.0-flash"]},
|
| 98 |
+
{"gemini-2.0-flash": ["gemini-2.0-flash-lite"]},
|
| 99 |
+
{"gemini-2.0-flash-lite": ["gemini-2.5-flash-lite-preview-06-17"]},
|
| 100 |
+
],
|
| 101 |
+
num_retries=1,
|
| 102 |
api_key=os.getenv("API_KEY"),
|
| 103 |
)
|
| 104 |
self.agent = CodeAgent(
|