petrov826 committed on
Commit
9d4b13b
·
verified ·
1 Parent(s): 95fed74

add more fallback models

Browse files
Files changed (1) hide show
  1. app.py +15 -4
app.py CHANGED
@@ -55,7 +55,6 @@ class BasicAgent:
55
  "rpm": 5,
56
  "tpm": 250_000,
57
  },
58
- "fallbacks": ["gemini/gemini-2.5-flash"],
59
  },
60
  {
61
  "model_name": "gemini-family",
@@ -64,7 +63,6 @@ class BasicAgent:
64
  "rpm": 10,
65
  "tpm": 250_000,
66
  },
67
- "fallbacks": ["gemini/gemini-2.0-flash"]
68
  },
69
  {
70
  "model_name": "gemini-family",
@@ -73,7 +71,6 @@ class BasicAgent:
73
  "rpm": 15,
74
  "tpm": 1_000_000,
75
  },
76
- "fallbacks": ["gemini/gemini-2.0-flash-lite"]
77
  },
78
  {
79
  "model_name": "gemini-family",
@@ -83,11 +80,25 @@ class BasicAgent:
83
  "tpm": 1_000_000,
84
  },
85
  },
 
 
 
 
 
 
 
 
86
  ],
87
  client_kwargs={
88
  "routing_strategy": "usage-based-routing-v2"
89
  },
90
- num_retries=5,
 
 
 
 
 
 
91
  api_key=os.getenv("API_KEY"),
92
  )
93
  self.agent = CodeAgent(
 
55
  "rpm": 5,
56
  "tpm": 250_000,
57
  },
 
58
  },
59
  {
60
  "model_name": "gemini-family",
 
63
  "rpm": 10,
64
  "tpm": 250_000,
65
  },
 
66
  },
67
  {
68
  "model_name": "gemini-family",
 
71
  "rpm": 15,
72
  "tpm": 1_000_000,
73
  },
 
74
  },
75
  {
76
  "model_name": "gemini-family",
 
80
  "tpm": 1_000_000,
81
  },
82
  },
83
+ {
84
+ "model_name": "gemini-family",
85
+ "litellm_params": {
86
+ "model": "gemini/gemini-2.5-flash-lite-preview-06-17",
87
+ "rpm": 15,
88
+ "tpm": 250_000,
89
+ },
90
+ },
91
  ],
92
  client_kwargs={
93
  "routing_strategy": "usage-based-routing-v2"
94
  },
95
+ fallbacks=[
96
+ {"gemini-2.5-pro": "gemini-2.5-flash"},
97
+ {"gemini-2.5-flash": ["gemini-2.0-flash"]},
98
+ {"gemini-2.0-flash": ["gemini-2.0-flash-lite"]},
99
+ {"gemini-2.0-flash-lite": ["gemini-2.5-flash-lite-preview-06-17"]},
100
+ ],
101
+ num_retries=1,
102
  api_key=os.getenv("API_KEY"),
103
  )
104
  self.agent = CodeAgent(