ai-lab-tube

Sleeping

ai-lab-tube / src /app /api /providers /huggingface /predictWithHuggingFace.ts

Julian Bilcke

remove stdout

cf329f1 almost 2 years ago

2.75 kB


	import { HfInference } from "@huggingface/inference"

	import { createZephyrPrompt } from "@/lib/prompts/createZephyrPrompt"

	import { LLMPredictionFunctionParams } from "../types"

	/**
	 * Prompt-template tokens and section headers that indicate the model has run
	 * past its own answer. Streaming stops as soon as one of them shows up in the
	 * accumulated output.
	 */
	const STOP_MARKERS: readonly string[] = [
	  "# Final",
	  "# Guidelines",
	  "</s>",
	  "<s>",
	  "/s>",
	  "[INST]",
	  "[/INST]",
	  "<SYS>",
	  "<<SYS>>",
	  "</SYS>",
	  "<</SYS>>",
	  "<|user|>",
	  "<|end|>",
	  "<|system|>",
	  "<|assistant|>",
	]

	/**
	 * Markers stripped from the final text: every stop marker plus "<|all|>".
	 * Sorted longest-first so a marker is removed before any shorter marker it
	 * contains (otherwise "<<SYS>>" would lose its inner "<SYS>" and leave "<>").
	 */
	const CLEANUP_MARKERS: readonly string[] = [...STOP_MARKERS, "<|all|>"].sort(
	  (a, b) => b.length - a.length
	)

	/**
	 * Removes every cleanup marker from raw model output, collapses doubled
	 * double-quotes into a single one, and trims surrounding whitespace.
	 */
	function cleanGeneratedText(raw: string): string {
	  // split/join deletes every literal occurrence of the marker
	  const withoutMarkers = CLEANUP_MARKERS.reduce(
	    (text, marker) => text.split(marker).join(""),
	    raw
	  )
	  return withoutMarkers.split('""').join('"').trim()
	}

	/**
	 * Streams a text completion from the Hugging Face Inference API and returns
	 * the cleaned-up result.
	 *
	 * - `systemPrompt` / `userPrompt`: passed to `createZephyrPrompt` as the
	 *   "system" and "user" messages.
	 * - `nbMaxNewTokens`: forwarded as `max_new_tokens`.
	 * - `turbo`: when truthy the Zephyr 7B model is used, otherwise Mixtral 8x7B
	 *   Instruct.
	 * - `prefix`: appended to the prompt after a newline so the model continues
	 *   from it; a missing prefix is treated as an empty string.
	 *
	 * Errors raised while streaming are swallowed on purpose (best effort): the
	 * text received so far is kept, except for "Model is overloaded", which
	 * discards it.
	 *
	 * @returns the generated text with markers removed; `prefix` is prepended
	 * when the text does not already start with it.
	 */
	export async function predict({
	  systemPrompt,
	  userPrompt,
	  nbMaxNewTokens,
	  turbo,
	  prefix,
	}: LLMPredictionFunctionParams): Promise<string> {
	  const hf = new HfInference(process.env.ADMIN_HUGGING_FACE_API_TOKEN)

	  // The prefix is handled as optional further down, so normalise it once:
	  // concatenating `undefined` would put the text "undefined" into the prompt.
	  const safePrefix = prefix ?? ""

	  const inputs =
	    createZephyrPrompt([
	      { role: "system", content: systemPrompt },
	      { role: "user", content: userPrompt },
	    ]) +
	    "\n" +
	    safePrefix

	  let instructions = ""
	  try {
	    for await (const output of hf.textGenerationStream({
	      model: turbo
	        ? "HuggingFaceH4/zephyr-7b-beta"
	        : "mistralai/Mixtral-8x7B-Instruct-v0.1",
	      inputs,
	      parameters: {
	        do_sample: true,
	        max_new_tokens: nbMaxNewTokens,
	        return_full_text: false,
	      },
	    })) {
	      instructions += output.token.text

	      // the model started emitting template tokens or a new section: stop here
	      if (STOP_MARKERS.some((marker) => instructions.includes(marker))) {
	        break
	      }
	    }
	  } catch (err) {
	    // a common failure is the model receiving too many requests; in that case
	    // nothing usable was produced, so drop the partial output
	    if (`${err}` === "Error: Model is overloaded") {
	      instructions = ""
	    }
	    // any other error: keep whatever was streamed before the failure
	  }

	  // clean up the garbage the LLM might have given us
	  const result = cleanGeneratedText(instructions)

	  if (safePrefix && !result.startsWith(safePrefix)) {
	    return safePrefix + result
	  }

	  return result
	}