krinlove committed on
Commit
6c8c86d
·
verified ·
1 Parent(s): 9bbfd57

Update config.yaml

Browse files
Files changed (1) hide show
  1. config.yaml +285 -283
config.yaml CHANGED
@@ -2,317 +2,319 @@
2
  # gemini-1.5-pro: 2 rpm, 32,000 tpm, 1,500 RPD
3
  # gemini-1.5-flash: 15 rpm, 1,000,000 tpm, 50 RPD
4
 
5
- model_list:
6
- # northflank
7
- - model_name: gpt-4o-mini-northflank
8
- litellm_params:
9
- model: openai/gpt-4o-mini
10
- api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
11
- api_key: os.environ/NF_API_KEY
12
- - model_name: gpt-4o-mini
13
- litellm_params:
14
- model: openai/gpt-4o-mini
15
- api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
16
- api_key: os.environ/NF_API_KEY
17
- - model_name: gpt-3.5-turbo-northflank
18
- litellm_params:
19
- model: openai/gpt-3.5-turbo
20
- api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
21
- api_key: os.environ/NF_API_KEY
22
- - model_name: gpt-3.5-turbo
23
- litellm_params:
24
- model: openai/gpt-3.5-turbo
25
- api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
26
- api_key: os.environ/NF_API_KEY
27
 
28
- # github
29
- - model_name: gpt-4o-k1
30
- litellm_params:
31
- model: github/gpt-4o
32
- api_base: https://models.inference.ai.azure.com
33
- api_key: os.environ/GITHUB_API_KEY1
34
- - model_name: github/gpt-4o
35
- litellm_params:
36
- model: github/gpt-4o
37
- api_key: os.environ/GITHUB_API_KEY1
38
- rpm: 30 # 15 * # of keys
39
- tpm: 2000000 # 1,000,000 * # of keys
40
 
41
- - model_name: gpt-4o-k2
42
- litellm_params:
43
- model: github/gpt-4o
44
- api_base: https://models.inference.ai.azure.com
45
- api_key: os.environ/GITHUB_API_KEY2
46
- - model_name: github/gpt-4o
47
- litellm_params:
48
- model: github/gpt-4o
49
- api_key: os.environ/GITHUB_API_KEY2
50
- rpm: 30 # 15 * # of keys
51
- tpm: 2000000 # 1,000,000 * # of keys
52
 
53
- - model_name: Mistral-large-2411-k1
54
- litellm_params:
55
- model: github/Mistral-large-2411
56
- api_base: https://models.inference.ai.azure.com
57
- api_key: os.environ/GITHUB_API_KEY1
58
- - model_name: github/Mistral-large-2411
59
- litellm_params:
60
- model: github/Mistral-large-2411
61
- api_key: os.environ/GITHUB_API_KEY1
62
- rpm: 30 # 15 * # of keys
63
- tpm: 2000000 # 1,000,000 * # of keys
64
 
65
- - model_name: Mistral-large-2411-k2
66
- litellm_params:
67
- model: github/Mistral-large-2411
68
- api_base: https://models.inference.ai.azure.com
69
- api_key: os.environ/GITHUB_API_KEY2
70
- - model_name: github/Mistral-large-2411
71
- litellm_params:
72
- model: github/Mistral-large-2411
73
- api_key: os.environ/GITHUB_API_KEY2
74
- rpm: 30 # 15 * # of keys
75
- tpm: 2000000 # 1,000,000 * # of keys
76
 
77
- - model_name: gpt-4o-mini-k1
78
- litellm_params:
79
- model: github/gpt-4o-mini
80
- api_base: https://models.inference.ai.azure.com
81
- api_key: os.environ/GITHUB_API_KEY1
82
- - model_name: github/gpt-4o-mini
83
- litellm_params:
84
- model: github/gpt-4o-mini
85
- api_key: os.environ/GITHUB_API_KEY1
86
- rpm: 30 # 15 * # of keys
87
- tpm: 2000000 # 1,000,000 * # of keys
88
 
89
- - model_name: gpt-4o-mini-k2
90
- litellm_params:
91
- model: github/gpt-4o-mini
92
- api_base: https://models.inference.ai.azure.com
93
- api_key: os.environ/GITHUB_API_KEY2
94
- - model_name: github/gpt-4o-mini
95
- litellm_params:
96
- model: github/gpt-4o-mini
97
- api_key: os.environ/GITHUB_API_KEY2
98
- rpm: 30 # 15 * # of keys
99
- tpm: 2000000 # 1,000,000 * # of keys
100
 
101
- # --------------gemini-1.5-pro--------------------
102
- - model_name: gemini-1.5-pro-k1
103
- litellm_params:
104
- model: gemini/gemini-1.5-pro
105
- api_key: os.environ/GEMINI_API_KEY1
106
- - model_name: gemini-1.5-pro
107
- litellm_params:
108
- model: gemini/gemini-1.5-pro
109
- api_key: os.environ/GEMINI_API_KEY1
110
- rpm: 4 # 2 * # of keys
111
- tpm: 6400 # 32,000 * # of keys
112
- - model_name: gemini-1.5-pro-k2
113
- litellm_params:
114
- model: gemini/gemini-1.5-pro
115
- api_key: os.environ/GEMINI_API_KEY2
116
- - model_name: gemini-1.5-pro
117
- litellm_params:
118
- model: gemini/gemini-1.5-pro
119
- api_key: os.environ/GEMINI_API_KEY
120
- rpm: 4 # 2 * # of keys
121
- tpm: 6400 # 32,000 * # of keys
122
 
123
- - model_name: gemini-1.5-pro-002-k1
124
- litellm_params:
125
- model: gemini/gemini-1.5-pro-002
126
- api_key: os.environ/GEMINI_API_KEY1
127
- - model_name: gemini-1.5-pro-002
128
- litellm_params:
129
- model: gemini/gemini-1.5-flash-002
130
- api_key: os.environ/GEMINI_API_KEY1
131
- rpm: 75 # 15 * # of keys
132
- tpm: 5000000 # 1,000,000 * # of keys
133
 
134
- - model_name: gemini-1.5-pro-002-k2
135
- litellm_params:
136
- model: gemini/gemini-1.5-pro-002
137
- api_key: os.environ/GEMINI_API_KEY2
138
- - model_name: gemini-1.5-pro-002
139
- litellm_params:
140
- model: gemini/gemini-1.5-pro-002
141
- api_key: os.environ/GEMINI_API_KEY2
142
- rpm: 75 # 15 * # of keys
143
- tpm: 5000000 # 1,000,000 * # of keys
144
 
145
- - model_name: gemini-1.5-pro-exp-k1
146
- litellm_params:
147
- model: gemini/gemini-1.5-pro-exp
148
- api_key: os.environ/GEMINI_API_KEY1
149
- - model_name: gemini-1.5-pro-exp
150
- litellm_params:
151
- model: gemini/gemini-1.5-pro-exp
152
- api_key: os.environ/GEMINI_API_KEY1
153
- rpm: 75 # 15 * # of keys
154
- tpm: 5000000 # 1,000,000 * # of keys
155
 
156
- - model_name: gemini-1.5-pro-exp-k2
157
- litellm_params:
158
- model: gemini/gemini-1.5-pro-exp
159
- api_key: os.environ/GEMINI_API_KEY2
160
- - model_name: gemini-1.5-pro-exp
161
- litellm_params:
162
- model: gemini/gemini-1.5-pro-exp
163
- api_key: os.environ/GEMINI_API_KEY2
164
- rpm: 75 # 15 * # of keys
165
- tpm: 5000000 # 1,000,000 * # of keys
166
 
167
- # --------------gemini-2.0-flash-exp--------------------
168
- - model_name: gemini-2.0-flash-exp-k1
169
- litellm_params:
170
- model: gemini/gemini-2.0-flash-exp
171
- api_key: os.environ/GEMINI_API_KEY1
172
- - model_name: gemini-2.0-flash-exp
173
- litellm_params:
174
- model: gemini/gemini-2.0-flash-exp
175
- api_key: os.environ/GEMINI_API_KEY1
176
- rpm: 50 # 2 * # of keys
177
- tpm: 5000000 # 32,000 * # of keys
178
 
179
- - model_name: gemini-2.0-flash-exp-k2
180
- litellm_params:
181
- model: gemini/gemini-2.0-flash-exp
182
- api_key: os.environ/GEMINI_API_KEY2
183
- - model_name: gemini-2.0-flash-exp
184
- litellm_params:
185
- model: gemini/gemini-2.0-flash-exp
186
- api_key: os.environ/GEMINI_API_KEY2
187
- rpm: 50 # 2 * # of keys
188
- tpm: 5000000 # 32,000 * # of keys
189
 
190
- - model_name: gemini-2.0-flash-thinking-exp-k1
191
- litellm_params:
192
- model: gemini/gemini-2.0-flash-thinking-exp
193
- api_key: os.environ/GEMINI_API_KEY1
194
- - model_name: gemini-2.0-flash-thinking-exp
195
- litellm_params:
196
- model: gemini/gemini-2.0-flash-thinking-exp
197
- api_key: os.environ/GEMINI_API_KEY1
198
- rpm: 50 # 2 * # of keys
199
- tpm: 5000000 # 32,000 * # of keys
200
 
201
- - model_name: gemini-2.0-flash-thinking-exp-k2
202
- litellm_params:
203
- model: gemini/gemini-2.0-flash-thinking-exp
204
- api_key: os.environ/GEMINI_API_KEY2
205
- - model_name: gemini-2.0-flash-thinking-exp
206
- litellm_params:
207
- model: gemini/gemini-2.0-flash-thinking-exp
208
- api_key: os.environ/GEMINI_API_KEY2
209
- rpm: 50 # 2 * # of keys
210
- tpm: 5000000 # 32,000 * # of keys
211
 
212
- - model_name: gemini-2.0-flash-thinking-exp-1219-k1
213
- litellm_params:
214
- model: gemini/gemini-2.0-flash-thinking-exp-1219
215
- api_key: os.environ/GEMINI_API_KEY1
216
- - model_name: gemini-2.0-flash-thinking-exp-1219
217
- litellm_params:
218
- model: gemini/gemini-2.0-flash-thinking-exp-1219
219
- api_key: os.environ/GEMINI_API_KEY1
220
- rpm: 50 # 2 * # of keys
221
- tpm: 5000000 # 32,000 * # of keys
222
 
223
- - model_name: gemini-2.0-flash-thinking-exp-1219-k2
224
- litellm_params:
225
- model: gemini/gemini-2.0-flash-thinking-exp-1219
226
- api_key: os.environ/GEMINI_API_KEY2
227
- - model_name: gemini-2.0-flash-thinking-exp-1219
228
- litellm_params:
229
- model: gemini/gemini-2.0-flash-thinking-exp-1219
230
- api_key: os.environ/GEMINI_API_KEY2
231
- rpm: 50 # 2 * # of keys
232
- tpm: 5000000 # 32,000 * # of keys
233
 
234
- # --------------gemini-exp-1206--------------------
235
- - model_name: gemini-exp-1206-k1
236
- litellm_params:
237
- model: gemini/gemini-exp-1206
238
- api_key: os.environ/GEMINI_API_KEY1
239
- - model_name: gemini-exp-1206
240
- litellm_params:
241
- model: gemini/gemini-exp-1206
242
- api_key: os.environ/GEMINI_API_KEY1
243
- rpm: 20 # 2 * # of keys
244
- tpm: 5000000 # 32,000 * # of keys
245
 
246
- - model_name: gemini-exp-1206-k2
247
- litellm_params:
248
- model: gemini/gemini-exp-1206
249
- api_key: os.environ/GEMINI_API_KEY2
250
- - model_name: gemini-exp-1206
251
- litellm_params:
252
- model: gemini/gemini-exp-1206
253
- api_key: os.environ/GEMINI_API_KEY2
254
- rpm: 20 # 2 * # of keys
255
- tpm: 5000000 # 32,000 * # of keys
256
 
257
- # --------------gemini-exp-1121--------------------
258
- - model_name: gemini-exp-1121-k1
259
- litellm_params:
260
- model: gemini/gemini-exp-1121
261
- api_key: os.environ/GEMINI_API_KEY1
262
- - model_name: gemini-exp-1121
263
- litellm_params:
264
- model: gemini/gemini-exp-1121
265
- api_key: os.environ/GEMINI_API_KEY1
266
- rpm: 20 # 2 * # of keys
267
- tpm: 5000000 # 32,000 * # of keys
268
 
269
- - model_name: gemini-exp-1121-k2
270
- litellm_params:
271
- model: gemini/gemini-exp-1121
272
- api_key: os.environ/GEMINI_API_KEY2
273
- - model_name: gemini-exp-1121
274
- litellm_params:
275
- model: gemini/gemini-exp-1121
276
- api_key: os.environ/GEMINI_API_KEY2
277
- rpm: 20 # 2 * # of keys
278
- tpm: 5000000 # 32,000 * # of keys
279
 
280
- # --------------gemini-exp-1114--------------------
281
- - model_name: gemini-exp-1114-k1
282
- litellm_params:
283
- model: gemini/gemini-exp-1114
284
- api_key: os.environ/GEMINI_API_KEY1
285
- - model_name: gemini-exp-1114
286
- litellm_params:
287
- model: gemini/gemini-exp-1114
288
- api_key: os.environ/GEMINI_API_KEY1
289
- rpm: 20 # 2 * # of keys
290
- tpm: 5000000 # 32,000 * # of keys
291
 
292
- - model_name: gemini-exp-1114-k2
293
- litellm_params:
294
- model: gemini/gemini-exp-1114
295
- api_key: os.environ/GEMINI_API_KEY2
296
- - model_name: gemini-exp-1114
297
- litellm_params:
298
- model: gemini/gemini-exp-1114
299
- api_key: os.environ/GEMINI_API_KEY2
300
- rpm: 20 # 2 * # of keys
301
- tpm: 5000000 # 32,000 * # of keys
302
 
303
  litellm_settings:
304
  # Networking settings
305
- request_timeout: 20 # (int) llm request timeout in seconds. Raise Timeout error if call takes longer than 10s. Sets litellm.request_timeout
306
- num_retries: 3
307
- fallbacks: [{"gemini-1.5-pro": ["gemini-1.5-flash"]}]
308
- allowed_fails: 3 # cooldown model if it fails > 1 call in a minute.
309
- cooldown_time: 30 # how long to cooldown model if fails/min > allowed_fails
 
 
310
  drop_params: true
311
 
312
  general_settings:
313
  master_key: os.environ/MASTER_KEY # sk-1234 # [OPTIONAL] Only use this if you require all calls to contain this key (Authorization: Bearer sk-1234)
314
 
315
- router_settings:
316
- fallbacks: [{"gpt-4o-mini": ["gemini-1.5-flash"]}, {"gpt-3.5-turbo": ["gemini-1.5-flash"]}]
317
- model_group_alias: {"gpt-4": "gemini-1.5-pro"}
318
- routing_strategy: simple-shuffle
 
2
  # gemini-1.5-pro: 2 rpm, 32,000 tpm, 1,500 RPD
3
  # gemini-1.5-flash: 15 rpm, 1,000,000 tpm, 50 RPD
4
 
5
+ # model_list:
6
+ # # northflank
7
+ # - model_name: gpt-4o-mini-northflank
8
+ # litellm_params:
9
+ # model: openai/gpt-4o-mini
10
+ # api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
11
+ # api_key: os.environ/NF_API_KEY
12
+ # - model_name: gpt-4o-mini
13
+ # litellm_params:
14
+ # model: openai/gpt-4o-mini
15
+ # api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
16
+ # api_key: os.environ/NF_API_KEY
17
+ # - model_name: gpt-3.5-turbo-northflank
18
+ # litellm_params:
19
+ # model: openai/gpt-3.5-turbo
20
+ # api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
21
+ # api_key: os.environ/NF_API_KEY
22
+ # - model_name: gpt-3.5-turbo
23
+ # litellm_params:
24
+ # model: openai/gpt-3.5-turbo
25
+ # api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
26
+ # api_key: os.environ/NF_API_KEY
27
 
28
+ # # github
29
+ # - model_name: gpt-4o-k1
30
+ # litellm_params:
31
+ # model: github/gpt-4o
32
+ # api_base: https://models.inference.ai.azure.com
33
+ # api_key: os.environ/GITHUB_API_KEY1
34
+ # - model_name: github/gpt-4o
35
+ # litellm_params:
36
+ # model: github/gpt-4o
37
+ # api_key: os.environ/GITHUB_API_KEY1
38
+ # rpm: 30 # 15 * # of keys
39
+ # tpm: 2000000 # 1,000,000 * # of keys
40
 
41
+ # - model_name: gpt-4o-k2
42
+ # litellm_params:
43
+ # model: github/gpt-4o
44
+ # api_base: https://models.inference.ai.azure.com
45
+ # api_key: os.environ/GITHUB_API_KEY2
46
+ # - model_name: github/gpt-4o
47
+ # litellm_params:
48
+ # model: github/gpt-4o
49
+ # api_key: os.environ/GITHUB_API_KEY2
50
+ # rpm: 30 # 15 * # of keys
51
+ # tpm: 2000000 # 1,000,000 * # of keys
52
 
53
+ # - model_name: Mistral-large-2411-k1
54
+ # litellm_params:
55
+ # model: github/Mistral-large-2411
56
+ # api_base: https://models.inference.ai.azure.com
57
+ # api_key: os.environ/GITHUB_API_KEY1
58
+ # - model_name: github/Mistral-large-2411
59
+ # litellm_params:
60
+ # model: github/Mistral-large-2411
61
+ # api_key: os.environ/GITHUB_API_KEY1
62
+ # rpm: 30 # 15 * # of keys
63
+ # tpm: 2000000 # 1,000,000 * # of keys
64
 
65
+ # - model_name: Mistral-large-2411-k2
66
+ # litellm_params:
67
+ # model: github/Mistral-large-2411
68
+ # api_base: https://models.inference.ai.azure.com
69
+ # api_key: os.environ/GITHUB_API_KEY2
70
+ # - model_name: github/Mistral-large-2411
71
+ # litellm_params:
72
+ # model: github/Mistral-large-2411
73
+ # api_key: os.environ/GITHUB_API_KEY2
74
+ # rpm: 30 # 15 * # of keys
75
+ # tpm: 2000000 # 1,000,000 * # of keys
76
 
77
+ # - model_name: gpt-4o-mini-k1
78
+ # litellm_params:
79
+ # model: github/gpt-4o-mini
80
+ # api_base: https://models.inference.ai.azure.com
81
+ # api_key: os.environ/GITHUB_API_KEY1
82
+ # - model_name: github/gpt-4o-mini
83
+ # litellm_params:
84
+ # model: github/gpt-4o-mini
85
+ # api_key: os.environ/GITHUB_API_KEY1
86
+ # rpm: 30 # 15 * # of keys
87
+ # tpm: 2000000 # 1,000,000 * # of keys
88
 
89
+ # - model_name: gpt-4o-mini-k2
90
+ # litellm_params:
91
+ # model: github/gpt-4o-mini
92
+ # api_base: https://models.inference.ai.azure.com
93
+ # api_key: os.environ/GITHUB_API_KEY2
94
+ # - model_name: github/gpt-4o-mini
95
+ # litellm_params:
96
+ # model: github/gpt-4o-mini
97
+ # api_key: os.environ/GITHUB_API_KEY2
98
+ # rpm: 30 # 15 * # of keys
99
+ # tpm: 2000000 # 1,000,000 * # of keys
100
 
101
+ # # --------------gemini-1.5-pro--------------------
102
+ # - model_name: gemini-1.5-pro-k1
103
+ # litellm_params:
104
+ # model: gemini/gemini-1.5-pro
105
+ # api_key: os.environ/GEMINI_API_KEY1
106
+ # - model_name: gemini-1.5-pro
107
+ # litellm_params:
108
+ # model: gemini/gemini-1.5-pro
109
+ # api_key: os.environ/GEMINI_API_KEY1
110
+ # rpm: 4 # 2 * # of keys
111
+ # tpm: 6400 # 32,000 * # of keys
112
+ # - model_name: gemini-1.5-pro-k2
113
+ # litellm_params:
114
+ # model: gemini/gemini-1.5-pro
115
+ # api_key: os.environ/GEMINI_API_KEY2
116
+ # - model_name: gemini-1.5-pro
117
+ # litellm_params:
118
+ # model: gemini/gemini-1.5-pro
119
+ # api_key: os.environ/GEMINI_API_KEY
120
+ # rpm: 4 # 2 * # of keys
121
+ # tpm: 6400 # 32,000 * # of keys
122
 
123
+ # - model_name: gemini-1.5-pro-002-k1
124
+ # litellm_params:
125
+ # model: gemini/gemini-1.5-pro-002
126
+ # api_key: os.environ/GEMINI_API_KEY1
127
+ # - model_name: gemini-1.5-pro-002
128
+ # litellm_params:
129
+ # model: gemini/gemini-1.5-flash-002
130
+ # api_key: os.environ/GEMINI_API_KEY1
131
+ # rpm: 75 # 15 * # of keys
132
+ # tpm: 5000000 # 1,000,000 * # of keys
133
 
134
+ # - model_name: gemini-1.5-pro-002-k2
135
+ # litellm_params:
136
+ # model: gemini/gemini-1.5-pro-002
137
+ # api_key: os.environ/GEMINI_API_KEY2
138
+ # - model_name: gemini-1.5-pro-002
139
+ # litellm_params:
140
+ # model: gemini/gemini-1.5-pro-002
141
+ # api_key: os.environ/GEMINI_API_KEY2
142
+ # rpm: 75 # 15 * # of keys
143
+ # tpm: 5000000 # 1,000,000 * # of keys
144
 
145
+ # - model_name: gemini-1.5-pro-exp-k1
146
+ # litellm_params:
147
+ # model: gemini/gemini-1.5-pro-exp
148
+ # api_key: os.environ/GEMINI_API_KEY1
149
+ # - model_name: gemini-1.5-pro-exp
150
+ # litellm_params:
151
+ # model: gemini/gemini-1.5-pro-exp
152
+ # api_key: os.environ/GEMINI_API_KEY1
153
+ # rpm: 75 # 15 * # of keys
154
+ # tpm: 5000000 # 1,000,000 * # of keys
155
 
156
+ # - model_name: gemini-1.5-pro-exp-k2
157
+ # litellm_params:
158
+ # model: gemini/gemini-1.5-pro-exp
159
+ # api_key: os.environ/GEMINI_API_KEY2
160
+ # - model_name: gemini-1.5-pro-exp
161
+ # litellm_params:
162
+ # model: gemini/gemini-1.5-pro-exp
163
+ # api_key: os.environ/GEMINI_API_KEY2
164
+ # rpm: 75 # 15 * # of keys
165
+ # tpm: 5000000 # 1,000,000 * # of keys
166
 
167
+ # # --------------gemini-2.0-flash-exp--------------------
168
+ # - model_name: gemini-2.0-flash-exp-k1
169
+ # litellm_params:
170
+ # model: gemini/gemini-2.0-flash-exp
171
+ # api_key: os.environ/GEMINI_API_KEY1
172
+ # - model_name: gemini-2.0-flash-exp
173
+ # litellm_params:
174
+ # model: gemini/gemini-2.0-flash-exp
175
+ # api_key: os.environ/GEMINI_API_KEY1
176
+ # rpm: 50 # 2 * # of keys
177
+ # tpm: 5000000 # 32,000 * # of keys
178
 
179
+ # - model_name: gemini-2.0-flash-exp-k2
180
+ # litellm_params:
181
+ # model: gemini/gemini-2.0-flash-exp
182
+ # api_key: os.environ/GEMINI_API_KEY2
183
+ # - model_name: gemini-2.0-flash-exp
184
+ # litellm_params:
185
+ # model: gemini/gemini-2.0-flash-exp
186
+ # api_key: os.environ/GEMINI_API_KEY2
187
+ # rpm: 50 # 2 * # of keys
188
+ # tpm: 5000000 # 32,000 * # of keys
189
 
190
+ # - model_name: gemini-2.0-flash-thinking-exp-k1
191
+ # litellm_params:
192
+ # model: gemini/gemini-2.0-flash-thinking-exp
193
+ # api_key: os.environ/GEMINI_API_KEY1
194
+ # - model_name: gemini-2.0-flash-thinking-exp
195
+ # litellm_params:
196
+ # model: gemini/gemini-2.0-flash-thinking-exp
197
+ # api_key: os.environ/GEMINI_API_KEY1
198
+ # rpm: 50 # 2 * # of keys
199
+ # tpm: 5000000 # 32,000 * # of keys
200
 
201
+ # - model_name: gemini-2.0-flash-thinking-exp-k2
202
+ # litellm_params:
203
+ # model: gemini/gemini-2.0-flash-thinking-exp
204
+ # api_key: os.environ/GEMINI_API_KEY2
205
+ # - model_name: gemini-2.0-flash-thinking-exp
206
+ # litellm_params:
207
+ # model: gemini/gemini-2.0-flash-thinking-exp
208
+ # api_key: os.environ/GEMINI_API_KEY2
209
+ # rpm: 50 # 2 * # of keys
210
+ # tpm: 5000000 # 32,000 * # of keys
211
 
212
+ # - model_name: gemini-2.0-flash-thinking-exp-1219-k1
213
+ # litellm_params:
214
+ # model: gemini/gemini-2.0-flash-thinking-exp-1219
215
+ # api_key: os.environ/GEMINI_API_KEY1
216
+ # - model_name: gemini-2.0-flash-thinking-exp-1219
217
+ # litellm_params:
218
+ # model: gemini/gemini-2.0-flash-thinking-exp-1219
219
+ # api_key: os.environ/GEMINI_API_KEY1
220
+ # rpm: 50 # 2 * # of keys
221
+ # tpm: 5000000 # 32,000 * # of keys
222
 
223
+ # - model_name: gemini-2.0-flash-thinking-exp-1219-k2
224
+ # litellm_params:
225
+ # model: gemini/gemini-2.0-flash-thinking-exp-1219
226
+ # api_key: os.environ/GEMINI_API_KEY2
227
+ # - model_name: gemini-2.0-flash-thinking-exp-1219
228
+ # litellm_params:
229
+ # model: gemini/gemini-2.0-flash-thinking-exp-1219
230
+ # api_key: os.environ/GEMINI_API_KEY2
231
+ # rpm: 50 # 2 * # of keys
232
+ # tpm: 5000000 # 32,000 * # of keys
233
 
234
+ # # --------------gemini-exp-1206--------------------
235
+ # - model_name: gemini-exp-1206-k1
236
+ # litellm_params:
237
+ # model: gemini/gemini-exp-1206
238
+ # api_key: os.environ/GEMINI_API_KEY1
239
+ # - model_name: gemini-exp-1206
240
+ # litellm_params:
241
+ # model: gemini/gemini-exp-1206
242
+ # api_key: os.environ/GEMINI_API_KEY1
243
+ # rpm: 20 # 2 * # of keys
244
+ # tpm: 5000000 # 32,000 * # of keys
245
 
246
+ # - model_name: gemini-exp-1206-k2
247
+ # litellm_params:
248
+ # model: gemini/gemini-exp-1206
249
+ # api_key: os.environ/GEMINI_API_KEY2
250
+ # - model_name: gemini-exp-1206
251
+ # litellm_params:
252
+ # model: gemini/gemini-exp-1206
253
+ # api_key: os.environ/GEMINI_API_KEY2
254
+ # rpm: 20 # 2 * # of keys
255
+ # tpm: 5000000 # 32,000 * # of keys
256
 
257
+ # # --------------gemini-exp-1121--------------------
258
+ # - model_name: gemini-exp-1121-k1
259
+ # litellm_params:
260
+ # model: gemini/gemini-exp-1121
261
+ # api_key: os.environ/GEMINI_API_KEY1
262
+ # - model_name: gemini-exp-1121
263
+ # litellm_params:
264
+ # model: gemini/gemini-exp-1121
265
+ # api_key: os.environ/GEMINI_API_KEY1
266
+ # rpm: 20 # 2 * # of keys
267
+ # tpm: 5000000 # 32,000 * # of keys
268
 
269
+ # - model_name: gemini-exp-1121-k2
270
+ # litellm_params:
271
+ # model: gemini/gemini-exp-1121
272
+ # api_key: os.environ/GEMINI_API_KEY2
273
+ # - model_name: gemini-exp-1121
274
+ # litellm_params:
275
+ # model: gemini/gemini-exp-1121
276
+ # api_key: os.environ/GEMINI_API_KEY2
277
+ # rpm: 20 # 2 * # of keys
278
+ # tpm: 5000000 # 32,000 * # of keys
279
 
280
+ # # --------------gemini-exp-1114--------------------
281
+ # - model_name: gemini-exp-1114-k1
282
+ # litellm_params:
283
+ # model: gemini/gemini-exp-1114
284
+ # api_key: os.environ/GEMINI_API_KEY1
285
+ # - model_name: gemini-exp-1114
286
+ # litellm_params:
287
+ # model: gemini/gemini-exp-1114
288
+ # api_key: os.environ/GEMINI_API_KEY1
289
+ # rpm: 20 # 2 * # of keys
290
+ # tpm: 5000000 # 32,000 * # of keys
291
 
292
+ # - model_name: gemini-exp-1114-k2
293
+ # litellm_params:
294
+ # model: gemini/gemini-exp-1114
295
+ # api_key: os.environ/GEMINI_API_KEY2
296
+ # - model_name: gemini-exp-1114
297
+ # litellm_params:
298
+ # model: gemini/gemini-exp-1114
299
+ # api_key: os.environ/GEMINI_API_KEY2
300
+ # rpm: 20 # 2 * # of keys
301
+ # tpm: 5000000 # 32,000 * # of keys
302
 
303
  litellm_settings:
304
  # Networking settings
305
+ # request_timeout: 20 # (int) llm request timeout in seconds. Raise Timeout error if call takes longer than 20s. Sets litellm.request_timeout
306
+ # num_retries: 3
307
+ # fallbacks: [{"gemini-1.5-pro": ["gemini-1.5-flash"]}]
308
+ # allowed_fails: 3 # cooldown model if it fails > 3 calls in a minute.
309
+ # cooldown_time: 30 # how long to cooldown model if fails/min > allowed_fails
310
+ success_callback: ["langfuse"]
311
+ failure_callback: ["langfuse"]
312
  drop_params: true
313
 
314
  general_settings:
315
  master_key: os.environ/MASTER_KEY # sk-1234 # [OPTIONAL] Only use this if you require all calls to contain this key (Authorization: Bearer sk-1234)
316
 
317
+ # router_settings:
318
+ # fallbacks: [{"gpt-4o-mini": ["gemini-1.5-flash"]}, {"gpt-3.5-turbo": ["gemini-1.5-flash"]}]
319
+ # model_group_alias: {"gpt-4": "gemini-1.5-pro"}
320
+ # routing_strategy: simple-shuffle