Spaces:

purpleriann
/

LLM-Engineers-Handbook

Runtime error

Upload folder using huggingface_hub

a22e84b verified 8 months ago

1.18 kB

	from __future__ import annotations

	from llm_engineering.domain.inference import Inference
	from llm_engineering.settings import settings


	class InferenceExecutor:
	    """Fill a prompt template with a query and context and run it through an LLM.

	    The executor stores the LLM client, the user query, the optional context
	    and the prompt template at construction time; :meth:`execute` renders the
	    template, hands it to the client and returns the generated text.
	    """

	    # Default template used when the caller does not supply ``prompt``.
	    # Written as explicit per-line literals so the template's whitespace does
	    # not depend on how this source file happens to be indented.
	    _DEFAULT_PROMPT = (
	        "\n"
	        "You are a content creator. Write what the user asked you to while using the provided context as the primary source of information for the content.\n"
	        "User query: {query}\n"
	        "Context: {context}\n"
	    )

	    def __init__(
	        self,
	        llm: Inference,
	        query: str,
	        context: str | None = None,
	        prompt: str | None = None,
	    ) -> None:
	        """Store the client and the pieces needed to build the prompt.

	        Args:
	            llm: Client exposing ``set_payload(inputs=..., parameters=...)``
	                and ``inference()``, both of which :meth:`execute` calls.
	            query: User request substituted for ``{query}`` in the template.
	            context: Text substituted for ``{context}``. ``None`` or any
	                other falsy value is stored as ``""``.
	            prompt: ``str.format`` template rendered with the keyword
	                arguments ``query`` and ``context``. Only ``None`` selects
	                the built-in default; an empty string is kept as given.
	                Literal braces in a custom template must be doubled
	                (``{{`` / ``}}``).
	        """
	        self.llm = llm
	        self.query = query
	        # Falsy context collapses to "" so the template never renders "None".
	        self.context = context or ""
	        self.prompt = self._DEFAULT_PROMPT if prompt is None else prompt

	    def execute(self) -> str:
	        """Render the prompt, send it to the LLM and return the generated text.

	        Returns:
	            The ``"generated_text"`` entry of the first element returned by
	            ``self.llm.inference()``.

	        Raises:
	            KeyError, IndexError, ValueError: From ``str.format`` when a
	                custom template references a placeholder other than
	                ``query``/``context`` or contains unbalanced braces.
	        """
	        rendered_prompt = self.prompt.format(query=self.query, context=self.context)
	        generation_parameters = {
	            "max_new_tokens": settings.MAX_NEW_TOKENS_INFERENCE,
	            "repetition_penalty": 1.1,
	            "temperature": settings.TEMPERATURE_INFERENCE,
	        }
	        self.llm.set_payload(inputs=rendered_prompt, parameters=generation_parameters)

	        # The response is indexed as a sequence of dicts; only the first
	        # element's generated text is returned.
	        return self.llm.inference()[0]["generated_text"]