# Hosting-page header captured alongside this file (not configuration):
#   Spaces: Running / Running
#   File size: 5,412 Bytes
# Container image coordinates: repository and image name.
image:
  repository: huggingface
  name: chat-ui
# Node label selector: matches nodes labelled role-huggingchat=true.
# The value is quoted so it stays a string rather than a YAML boolean.
nodeSelector:
  role-huggingchat: "true"
# Single toleration for the taint huggingface.co/huggingchat=true:NoSchedule.
tolerations:
  - key: "huggingface.co/huggingchat"
    operator: "Equal"
    value: "true"
    effect: "NoSchedule"
# Service account settings: enabled, created, and named huggingchat-prod.
serviceAccount:
  enabled: true
  create: true
  name: huggingchat-prod
# Ingress for the /chat path, using the "alb" ingress class.
# All annotation values are strings; listen-ports carries a JSON document,
# so it is single-quoted to avoid backslash-escaping the inner double quotes.
ingress:
  path: "/chat"
  annotations:
    alb.ingress.kubernetes.io/healthcheck-path: "/healthcheck"
    alb.ingress.kubernetes.io/listen-ports: '[{"HTTP": 80}, {"HTTPS": 443}]'
    alb.ingress.kubernetes.io/group.name: "hub-prod"
    alb.ingress.kubernetes.io/scheme: "internet-facing"
    alb.ingress.kubernetes.io/ssl-redirect: "443"
    alb.ingress.kubernetes.io/tags: "Env=prod,Project=hub,Terraform=true"
    alb.ingress.kubernetes.io/target-node-labels: "role-hub-utils=true"
    kubernetes.io/ingress.class: "alb"
# Second ingress for the same /chat path, attached to the
# hub-prod-internal-public ALB group / load balancer.
# listen-ports carries a JSON document, so it is single-quoted to avoid
# backslash-escaping the inner double quotes.
ingressInternal:
  enabled: true
  path: "/chat"
  annotations:
    alb.ingress.kubernetes.io/group.name: hub-prod-internal-public
    alb.ingress.kubernetes.io/healthcheck-path: "/healthcheck"
    alb.ingress.kubernetes.io/listen-ports: '[{"HTTP": 80}, {"HTTPS": 443}]'
    alb.ingress.kubernetes.io/load-balancer-name: hub-prod-internal-public
    alb.ingress.kubernetes.io/target-group-attributes: deregistration_delay.timeout_seconds=30
    alb.ingress.kubernetes.io/target-node-labels: role-hub-lb=true
    alb.ingress.kubernetes.io/target-type: ip
    kubernetes.io/ingress.class: "alb"
# Environment variables for the application.
# Every value is written as a string so YAML implicit typing cannot turn
# "true"/"0" into a boolean or integer before it reaches the environment.
# JSON-valued variables use folded block scalars (">"); their bodies must stay
# indented deeper than the key.
envVars:
  ADMIN_CLI_LOGIN: "false"
  ALTERNATIVE_REDIRECT_URLS: '["huggingchat://login/callback"]'
  APP_BASE: "/chat"
  ALLOW_IFRAME: "false"
  COMMUNITY_TOOLS: "true"
  COOKIE_SAMESITE: "lax"
  COOKIE_SECURE: "true"
  ENABLE_ASSISTANTS: "true"
  ENABLE_CONFIG_MANAGER: "false"
  # NOTE(review): debug-level logging in a prod values file; confirm intended.
  LOG_LEVEL: "debug"
  NODE_ENV: "prod"
  NODE_LOG_STRUCTURED_DATA: "true"
  # JSON array of model entries; some carry a "transferTo" replacement model name.
  OLD_MODELS: >
    [
      { "name": "bigcode/starcoder" },
      { "name": "OpenAssistant/oasst-sft-6-llama-30b-xor" },
      { "name": "HuggingFaceH4/zephyr-7b-alpha" },
      { "name": "openchat/openchat_3.5" },
      { "name": "openchat/openchat-3.5-1210" },
      { "name": "tiiuae/falcon-180B-chat" },
      { "name": "codellama/CodeLlama-34b-Instruct-hf" },
      { "name": "google/gemma-7b-it" },
      { "name": "meta-llama/Llama-2-70b-chat-hf" },
      { "name": "codellama/CodeLlama-70b-Instruct-hf" },
      { "name": "openchat/openchat-3.5-0106" },
      { "name": "meta-llama/Meta-Llama-3-70B-Instruct" },
      { "name": "meta-llama/Meta-Llama-3.1-405B-Instruct-FP8" },
      {
        "name": "CohereForAI/c4ai-command-r-plus-08-2024",
        "transferTo": "CohereLabs/c4ai-command-r-plus-08-2024"
      },
      {
        "name": "CohereForAI/c4ai-command-r-plus",
        "transferTo": "CohereLabs/c4ai-command-r-plus-08-2024"
      },
      {
        "name": "01-ai/Yi-1.5-34B-Chat",
        "transferTo": "CohereLabs/c4ai-command-r-plus-08-2024"
      },
      {
        "name": "mistralai/Mixtral-8x7B-Instruct-v0.1",
        "transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
      },
      {
        "name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
        "transferTo": "NousResearch/Hermes-3-Llama-3.1-8B"
      },
      {
        "name": "mistralai/Mistral-7B-Instruct-v0.3",
        "transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
      },
      {
        "name": "microsoft/Phi-3-mini-4k-instruct",
        "transferTo": "microsoft/Phi-4"
      },
      {
        "name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
        "transferTo": "meta-llama/Llama-3.3-70B-Instruct"
      },
      {
        "name": "Qwen/QwQ-32B-Preview",
        "transferTo": "Qwen/QwQ-32B"
      },
      {
        "name": "mistralai/Mistral-Nemo-Instruct-2407",
        "transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
      },
      {
        "name": "microsoft/Phi-3.5-mini-instruct",
        "transferTo": "microsoft/Phi-4"
      },
      {
        "name": "Qwen/Qwen2.5-Coder-32B-Instruct",
        "transferTo": "Qwen/QwQ-32B"
      },
      {
        "name": "meta-llama/Llama-3.2-11B-Vision-Instruct",
        "transferTo" : "Qwen/Qwen2.5-VL-32B-Instruct"
      }
    ]
  PUBLIC_ORIGIN: "https://huggingface.co"
  PUBLIC_SHARE_PREFIX: "https://hf.co/chat"
  # JSON array of banner objects (title, link title, link target).
  PUBLIC_ANNOUNCEMENT_BANNERS: >
    [
      {
        "title": "Qwen 3 235B is available!",
        "linkTitle": "Try it out!",
        "linkHref": "https://huggingface.co/chat/models/Qwen/Qwen3-235B-A22B"
      }
    ]
  PUBLIC_APP_NAME: "HuggingChat"
  PUBLIC_APP_ASSETS: "huggingchat"
  PUBLIC_APP_COLOR: "yellow"
  PUBLIC_APP_DESCRIPTION: "Making the community's best AI chat models available to everyone."
  PUBLIC_APP_GUEST_MESSAGE: "Sign in with a free Hugging Face account to continue using HuggingChat."
  PUBLIC_APP_DATA_SHARING: "0"
  PUBLIC_PLAUSIBLE_SCRIPT_URL: "/js/script.js"
  # JSON object describing one model: name, endpoint type, generation parameters.
  TASK_MODEL: >
    {
      "name": "NousResearch/Hermes-3-Llama-3.1-8B",
      "unlisted": true,
      "endpoints": [{"type" : "inference-client"}],
      "parameters": {
        "temperature": 0.1,
        "max_new_tokens": 256
      }
    }
  HF_ORG_ADMIN: '644171cfbd0c97265298aa99'
  HF_ORG_EARLY_ACCESS: '5e67bd5b1009063689407478'
# Infisical integration: enabled, using the "prod-us-east-1" environment.
infisical:
  enabled: true
  env: "prod-us-east-1"
# Autoscaling bounds (2 to 30 replicas) and utilization targets.
# NOTE(review): both utilization targets are quoted strings, not integers;
# confirm the consuming template converts them before use.
autoscaling:
  enabled: true
  minReplicas: 2
  maxReplicas: 30
  targetMemoryUtilizationPercentage: "50"
  targetCPUUtilizationPercentage: "50"
# Per-container resources: requests of 2 CPU / 4Gi, limits of 4 CPU / 8Gi.
resources:
  requests:
    cpu: 2
    memory: 4Gi
  limits:
    cpu: 4
    memory: 8Gi