ffreemt committed on
Commit
4279fc2
·
1 Parent(s): 6fa4744

num_workers 4

Browse files
Files changed (3) hide show
  1. Dockerfile +3 -3
  2. litellm_config-bk.yaml +112 -0
  3. litellm_config.yaml +6 -2
Dockerfile CHANGED
@@ -15,7 +15,7 @@
15
 
16
  from ghcr.io/berriai/litellm:main-latest
17
 
18
- # SERVER_ROOT_PATH=/hf/v1
19
  # ENV LITELLM_LOG=DEBUG
20
  ENV STORE_MODEL_IN_DB=true
21
  ENV TZ=Asia/Shanghai OPENAI_API_KEY=any SERVER_ROOT_PATH=/v1 CONFIG_FILE_PATH=/app/config.yaml
@@ -23,10 +23,10 @@ ENV TZ=Asia/Shanghai OPENAI_API_KEY=any SERVER_ROOT_PATH=/v1 CONFIG_FILE_PATH=/a
23
  COPY ./litellm_config.yaml /app/config.yaml
24
  EXPOSE 7860
25
 
26
- ENTRYPOINT ["litellm"]
27
 
28
  # "--num_workers", "8"
29
  # env CONFIG_FILE_PATH=/app/config.yaml
30
  # CMD [ "--config", "/app/config.yaml", "--port", "7860", "--num_workers", "2" ]
31
 
32
- CMD [ "--port", "7860", "--num_workers", "8" ]
 
15
 
16
  from ghcr.io/berriai/litellm:main-latest
17
 
18
+ # SERVER_ROOT_PATH=/hf/v1
19
  # ENV LITELLM_LOG=DEBUG
20
  ENV STORE_MODEL_IN_DB=true
21
  ENV TZ=Asia/Shanghai OPENAI_API_KEY=any SERVER_ROOT_PATH=/v1 CONFIG_FILE_PATH=/app/config.yaml
 
23
  COPY ./litellm_config.yaml /app/config.yaml
24
  EXPOSE 7860
25
 
26
+ ENTRYPOINT ["litellm"]
27
 
28
  # "--num_workers", "8"
29
  # env CONFIG_FILE_PATH=/app/config.yaml
30
  # CMD [ "--config", "/app/config.yaml", "--port", "7860", "--num_workers", "2" ]
31
 
32
+ CMD [ "--port", "7860", "--num_workers", "4" ]
litellm_config-bk.yaml ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_list:
2
+ # - model_name: "anthropic/*"
3
+ # litellm_params:
4
+ # model: "openrouter/qwen/qwen3-coder" # Qwen/Qwen3-Coder-480B-A35B-Instruct
5
+ # max_tokens: 65536
6
+ # repetition_penalty: 1.05
7
+ # temperature: 0.7
8
+ # top_k: 20
9
+ # top_p: 0.8
10
+
11
+ # OK curl, ccr not OK, ccapi use litellm-v0 OK, anthropic-curl OK
12
+ - model_name: v0-a
13
+ litellm_params:
14
+ model: v0/v0-1.5-md
15
+ api_base: https://api.v0.dev/v1
16
+ api_key: os.environ/V0_API_KEY1
17
+ model_info:
18
+ max_tokens: 200_000
19
+ id: v0/v0-1.5-md
20
+ additionalProp1:
21
+ info: v0-bug-team
22
+ - model_name: v0-b
23
+ litellm_params:
24
+ model: v0/v0-1.5-md
25
+ api_base: https://api.v0.dev/v1
26
+ api_key: os.environ/V0_API_KEY2
27
+ - model_name: v0-c
28
+ litellm_params:
29
+ model: v0/v0-1.5-md
30
+ api_base: https://api.v0.dev/v1
31
+ api_key: os.environ/V0_API_KEY3
32
+ - model_name: v0
33
+ litellm_params:
34
+ model: v0/v0-1.5-md
35
+ api_base: https://api.v0.dev/v1
36
+ api_key: os.environ/V0_API_KEY1
37
+ model_info:
38
+ max_tokens: 200_000
39
+ id: v0/v0-1.5-md
40
+ additionalProp1:
41
+ info: v0-bug-team
42
+ - model_name: v0
43
+ litellm_params:
44
+ model: v0/v0-1.5-md
45
+ api_base: https://api.v0.dev/v1
46
+ api_key: os.environ/V0_API_KEY2
47
+ - model_name: v0
48
+ litellm_params:
49
+ model: v0/v0-1.5-md
50
+ api_base: https://api.v0.dev/v1
51
+ api_key: os.environ/V0_API_KEY3
52
+
53
+ # https://elysiver.h-e.top/v1 <API key redacted; supply it via the ELY_API_KEY environment variable> kimi-k2.5
54
+ - model_name: kimi-k2.5-elysiver
55
+ litellm_params:
56
+ model: openai/kimi-k2.5
57
+ api_base: https://elysiver.h-e.top/v1
58
+ api_key: os.environ/ELY_API_KEY
59
+ - model_name: kimi-k2.5
60
+ litellm_params:
61
+ model: openai/kimi-k2.5
62
+ api_base: https://elysiver.h-e.top/v1
63
+ api_key: os.environ/ELY_API_KEY
64
+ - model_name: gemini-2.5-flash-lite-elysiver
65
+ litellm_params:
66
+ model: openai/gemini-2.5-flash-lite
67
+ api_base: https://elysiver.h-e.top/v1
68
+ api_key: os.environ/ELY_API_KEY
69
+ - model_name: gemini-2.5-flash-lite
70
+ litellm_params:
71
+ model: openai/gemini-2.5-flash-lite
72
+ api_base: https://elysiver.h-e.top/v1
73
+ api_key: os.environ/ELY_API_KEY
74
+
75
+ - model_name: claude-sonnet-4
76
+ litellm_params:
77
+ model: openrouter/claude-sonnet-4
78
+ api_base: https://aidrouter.qzz.io/v1
79
+ api_key: os.environ/AIDROUTER_API_KEY
80
+ - model_name: claude-opus-4-6
81
+ litellm_params:
82
+ model: openrouter/claude-opus-4-6
83
+ api_base: https://aidrouter.qzz.io/v1
84
+ api_key: os.environ/AIDROUTER_API_KEY
85
+ - model_name: gemini-3-flash-preview
86
+ litellm_params:
87
+ model: openrouter/gemini-3-flash-preview
88
+ api_base: https://aidrouter.qzz.io/v1
89
+ api_key: os.environ/AIDROUTER_API_KEY
90
+
91
+ general_settings:
92
+ # master_key: "sk-1234" # Disabled for easy testing
93
+ # master_key: ${LITELLM_MASTER_KEY}
94
+ master_key: os.environ/LITELLM_MASTER_KEY
95
+
96
+ # litellm --config parent_config.yaml --detailed_debug/--debug
97
+ # os.environ["LITELLM_LOG"] = "INFO" or os.environ["LITELLM_LOG"] = "DEBUG"
98
+ # https://docs.litellm.ai/docs/proxy/config_settings
99
+ litellm_settings:
100
+ # set_verbose: true # deprecated, use `os.environ['LITELLM_LOG'] = 'DEBUG'`
101
+ request_timeout: 180
102
+ drop_params: true
103
+ fallbacks:
104
+ - v0: [gemini-2.5-flash-lite,gemini-2.5-flash]
105
+ - kimi-k2.5: [gemini-2.5-flash-lite]
106
+ # - gemini-2.5-flash: [gemini-2.5-flash-lite]
107
+ router_settings:
108
+ model_group_alias:
109
+ gpt-4o: gemini-2.5-flash-lite
110
+ gpt-4.1-mini: gemini-2.5-flash-lite
111
+ gpt-5-codex: kimi-k2.5
112
+ gpt-5.1-codex: kimi-k2.5
litellm_config.yaml CHANGED
@@ -103,10 +103,14 @@ litellm_settings:
103
  fallbacks:
104
  - v0: [gemini-2.5-flash-lite,gemini-2.5-flash]
105
  - kimi-k2.5: [gemini-2.5-flash-lite]
 
 
 
106
  # - gemini-2.5-flash: [gemini-2.5-flash-lite]
 
107
  router_settings:
108
  model_group_alias:
109
  gpt-4o: gemini-2.5-flash-lite
110
  gpt-4.1-mini: gemini-2.5-flash-lite
111
- gpt-5-codex: kimi-k2.5
112
- gpt-5.1-codex: kimi-k2.5
 
103
  fallbacks:
104
  - v0: [gemini-2.5-flash-lite,gemini-2.5-flash]
105
  - kimi-k2.5: [gemini-2.5-flash-lite]
106
+ - claude-4.6-sonnet: [openrouter/claude-4.6-sonnet,openrouter/claude-4.5-sonnet,v0]
107
+ - claude-4.5-sonnet: [openrouter/claude-4.5-sonnet,v0]
108
+
109
  # - gemini-2.5-flash: [gemini-2.5-flash-lite]
110
+
111
  router_settings:
112
  model_group_alias:
113
  gpt-4o: gemini-2.5-flash-lite
114
  gpt-4.1-mini: gemini-2.5-flash-lite
115
+ gpt-5-codex: claude-4.5-sonnet
116
+ gpt-5.1-codex: claude-4.5-sonnet