slockers committed on
Commit
8b5f428
·
1 Parent(s): ea89d9d

added models

Browse files
Files changed (1) hide show
  1. config.yaml +89 -13
config.yaml CHANGED
@@ -1,7 +1,3 @@
1
- # aistudio gemini free, Rate Limits https://ai.google.dev/pricing#1_5pro
2
- # gemini-1.5-pro: 2 rpm, 32,000 tpm, 1,500 RPD
3
- # gemini-1.5-flash: 15 rpm, 1,000,000 tpm, 50 RPD
4
-
5
  model_list:
6
 
7
  # --------------gemini-2.0-flash-exp--------------------
@@ -99,20 +95,20 @@ model_list:
99
  model: huggingface/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
100
  api_key: os.environ/HUGGINGFACE_API_KEY1
101
 
102
- - model_name: hg2/DeepSeek-R1-Distill-Qwen-32B
103
- litellm_params:
104
- model: huggingface/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
105
- api_key: os.environ/HUGGINGFACE_API_KEY2
106
 
107
  - model_name: hg1/Llama-3.3-70B-Instruct
108
  litellm_params:
109
  model: huggingface/meta-llama/Llama-3.3-70B-Instruct
110
  api_key: os.environ/HUGGINGFACE_API_KEY1
111
 
112
- - model_name: hg2/Llama-3.3-70B-Instruct
113
- litellm_params:
114
- model: huggingface/meta-llama/Llama-3.3-70B-Instruct
115
- api_key: os.environ/HUGGINGFACE_API_KEY2
116
 
117
  # --------------hyperbolic--------------------
118
 
@@ -233,7 +229,87 @@ model_list:
233
  model: openai/meta-llama/Llama-3.3-70B-Instruct-Turbo
234
  api_base: os.environ/DDC_BASE_URL
235
  api_key: os.environ/DDC_API_KEY
 
 
236
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
237
  # --------------CB--------------------
238
 
239
  - model_name: cb/gpt-4o-mini
@@ -379,4 +455,4 @@ general_settings:
379
  router_settings:
380
  fallbacks: [{"or/gemini-2.0-flash-exp": ["gg1/gemini-2.0-flash-exp"]}, {"gpt-3.5-turbo": ["gemini-1.5-flash"]}]
381
  model_group_alias: {"gpt-4": "gemini-1.5-pro"}
382
- routing_strategy: simple-shuffle
 
 
 
 
 
1
  model_list:
2
 
3
  # --------------gemini-2.0-flash-exp--------------------
 
95
  model: huggingface/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
96
  api_key: os.environ/HUGGINGFACE_API_KEY1
97
 
98
+ # - model_name: hg2/DeepSeek-R1-Distill-Qwen-32B
99
+ # litellm_params:
100
+ # model: huggingface/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
101
+ # api_key: os.environ/HUGGINGFACE_API_KEY2
102
 
103
  - model_name: hg1/Llama-3.3-70B-Instruct
104
  litellm_params:
105
  model: huggingface/meta-llama/Llama-3.3-70B-Instruct
106
  api_key: os.environ/HUGGINGFACE_API_KEY1
107
 
108
+ # - model_name: hg2/Llama-3.3-70B-Instruct
109
+ # litellm_params:
110
+ # model: huggingface/meta-llama/Llama-3.3-70B-Instruct
111
+ # api_key: os.environ/HUGGINGFACE_API_KEY2
112
 
113
  # --------------hyperbolic--------------------
114
 
 
229
  model: openai/meta-llama/Llama-3.3-70B-Instruct-Turbo
230
  api_base: os.environ/DDC_BASE_URL
231
  api_key: os.environ/DDC_API_KEY
232
+
233
+ # --------------ZK--------------------
234
 
235
+ - model_name: zk/gpt-4o-mini
236
+ litellm_params:
237
+ model: openai/gpt-4o-mini
238
+ api_base: os.environ/ZK_BASE_URL
239
+ api_key: os.environ/ZK_API_KEY
240
+
241
+ - model_name: zk/gpt-4o
242
+ litellm_params:
243
+ model: openai/gpt-4o-2024-11-20
244
+ api_base: os.environ/ZK_BASE_URL
245
+ api_key: os.environ/ZK_API_KEY
246
+
247
+ - model_name: zk/chatgpt-4o-latest
248
+ litellm_params:
249
+ model: openai/chatgpt-4o-latest
250
+ api_base: os.environ/ZK_BASE_URL
251
+ api_key: os.environ/ZK_API_KEY
252
+
253
+ - model_name: zk/o3-mini
254
+ litellm_params:
255
+ model: openai/o3-mini
256
+ api_base: os.environ/ZK_BASE_URL
257
+ api_key: os.environ/ZK_API_KEY
258
+
259
+ - model_name: zk/claude-3-5-haiku
260
+ litellm_params:
261
+ model: openai/claude-3-5-haiku-20241022
262
+ api_base: os.environ/ZK_BASE_URL
263
+ api_key: os.environ/ZK_API_KEY
264
+
265
+ - model_name: zk/claude-3-5-sonnet
266
+ litellm_params:
267
+ model: openai/claude-3-5-sonnet-20241022
268
+ api_base: os.environ/ZK_BASE_URL
269
+ api_key: os.environ/ZK_API_KEY
270
+
271
+ - model_name: zk/claude-3-5-sonnet-20240620
272
+ litellm_params:
273
+ model: openai/claude-3-5-sonnet-20240620
274
+ api_base: os.environ/ZK_BASE_URL
275
+ api_key: os.environ/ZK_API_KEY
276
+
277
+ - model_name: zk/deepseek-chat
278
+ litellm_params:
279
+ model: openai/deepseek-chat
280
+ api_base: os.environ/ZK_BASE_URL
281
+ api_key: os.environ/ZK_API_KEY
282
+
283
+ - model_name: zk/deepseek-reasoner
284
+ litellm_params:
285
+ model: openai/deepseek-reasoner
286
+ api_base: os.environ/ZK_BASE_URL
287
+ api_key: os.environ/ZK_API_KEY
288
+
289
+ - model_name: zk/llama-3.3-70b-instruct
290
+ litellm_params:
291
+ model: openai/llama-3.3-70b-instruct
292
+ api_base: os.environ/ZK_BASE_URL
293
+ api_key: os.environ/ZK_API_KEY
294
+
295
+ - model_name: zk/sonar-pro
296
+ litellm_params:
297
+ model: openai/sonar-pro
298
+ api_base: os.environ/ZK_BASE_URL
299
+ api_key: os.environ/ZK_API_KEY
300
+
301
+ - model_name: zk/sonar
302
+ litellm_params:
303
+ model: openai/sonar
304
+ api_base: os.environ/ZK_BASE_URL
305
+ api_key: os.environ/ZK_API_KEY
306
+
307
+ - model_name: zk/sonar-reasoning
308
+ litellm_params:
309
+ model: openai/sonar-reasoning
310
+ api_base: os.environ/ZK_BASE_URL
311
+ api_key: os.environ/ZK_API_KEY
312
+
313
  # --------------CB--------------------
314
 
315
  - model_name: cb/gpt-4o-mini
 
455
  router_settings:
456
  fallbacks: [{"or/gemini-2.0-flash-exp": ["gg1/gemini-2.0-flash-exp"]}, {"gpt-3.5-turbo": ["gemini-1.5-flash"]}]
457
  model_group_alias: {"gpt-4": "gemini-1.5-pro"}
458
+ routing_strategy: simple-shuffle