chat-ui-energy

Paused

nsarrazin committed on Oct 16, 2024

Commit

c5ee468

unverified ·

1 Parent(s): dc6961c

feat(models): add `nvidia/Llama-3.1-Nemotron-70B-Instruct-HF` (#1527)

Files changed (2) hide show

chart/env/prod.yaml CHANGED Viewed

@@ -137,6 +137,23 @@ envVars:
           }
         ]
       },
       {
         "name": "meta-llama/Llama-3.2-11B-Vision-Instruct",
         "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/meta-logo.png",

           }
         ]
       },
+      {
+        "name": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",
+        "modelUrl": "https://huggingface.co/nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",
+        "websiteUrl": "https://www.nvidia.com/",
+        "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/nvidia-logo.png",
+        "description": "Nvidia's latest Llama fine-tune, topping alignment benchmarks and optimized for instruction following.",
+        "parameters": {
+          "stop": ["<|eot_id|>"],
+          "temperature": 0.6,
+          "truncate": 28672,
+          "max_new_tokens": 2048
+        },
+        "endpoint": {
+          "type": "openai",
+          "baseURL": "https://api-inference.huggingface.co/models/nvidia/Llama-3.1-Nemotron-70B-Instruct-HF/v1"
+        }
+      },
       {
         "name": "meta-llama/Llama-3.2-11B-Vision-Instruct",
         "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/meta-logo.png",

src/lib/server/models.ts CHANGED Viewed

@@ -319,7 +319,13 @@ const hasInferenceAPI = async (m: Awaited<ReturnType<typeof processModel>>) => {
 		return false;
 	}
-	const r = await fetch(`https://huggingface.co/api/models/${m.id}`);
 	if (!r.ok) {
 		logger.warn(`Failed to check if ${m.id} has inference API: ${r.statusText}`);

 		return false;
 	}
+	let r: Response;
+	try {
+		r = await fetch(`https://huggingface.co/api/models/${m.id}`);
+	} catch (e) {
+		console.log(e);
+		return false;
+	}
 	if (!r.ok) {
 		logger.warn(`Failed to check if ${m.id} has inference API: ${r.statusText}`);