Spaces:
Sleeping
Sleeping
| import os | |
| import tiktoken | |
| from typing import Union | |
| # from azure.identity import DefaultAzureCredential | |
| from langchain_openai.chat_models import AzureChatOpenAI, ChatOpenAI | |
class LLMFactory:
    """
    A static utility class to create and return LLM instances based on the input type.
    """

    @staticmethod
    def get_llm(llm_type: str) -> "Union[AzureChatOpenAI, ChatOpenAI]":
        """
        Return an LLM instance based on the specified type.

        Parameters:
            llm_type (str): The type of LLM to return. Valid values are
                'azure', 'openai', or 'openai_chat' (case-insensitive).

        Returns:
            Union[AzureChatOpenAI, ChatOpenAI]: The LLM instance.

        Raises:
            NotImplementedError: If 'azure' is requested — the Azure path
                (DefaultAzureCredential token + AzureChatOpenAI wired to the
                AZURE_OPENAI_API_* environment variables) is not yet enabled.
            ValueError: If llm_type is not one of the accepted values.
        """
        # Normalize once instead of lowercasing on every comparison.
        kind = llm_type.lower()
        if kind == "azure":
            # Previously returned None silently (bare `pass`), which violated
            # the declared return type; fail loudly until the Azure
            # credential flow is restored.
            raise NotImplementedError(
                "Azure support is not yet enabled; see commented-out "
                "DefaultAzureCredential flow in source history."
            )
        elif kind in ("openai", "openai_chat"):
            # Both aliases were duplicate branches returning the same client.
            return ChatOpenAI(
                api_key=os.environ["OPENAI_API_KEY"],
                model_name="gpt-4"
            )
        else:
            raise ValueError("Invalid llm_type. Use 'azure' or 'openai'.")
def num_tokens_from_messages(messages):
    """
    Count the tokens a list of chat messages will consume.

    Adapted from the OpenAI cookbook token counter. Each message dict is
    framed as ``<|start|>{role}{content}<|end|>``, which costs 3 framing
    tokens on top of the encoded field values; the assistant reply is
    primed with ``<|start|>assistant<|message|>`` (3 more tokens).
    """
    encoding = tiktoken.encoding_for_model("gpt-3.5-turbo")
    framing_tokens = 3  # <|start|> + role + <|end|>
    total = 3  # every reply is primed with <|start|>assistant<|message|>
    for message in messages:
        total += framing_tokens + sum(
            len(encoding.encode(text)) for text in message.values()
        )
    return total