# ADMP-LS / client/services/ai_service.py
import streamlit as st
from langchain_core.messages import HumanMessage, SystemMessage
from langchain_aws import ChatBedrock
from langchain_openai import ChatOpenAI
from langchain_groq import ChatGroq
from langchain_anthropic import ChatAnthropic
from langchain_google_genai import ChatGoogleGenerativeAI
from typing import Optional
from config import MODEL_OPTIONS
def create_llm_model(llm_provider: str, **kwargs):
    """Create a LangChain chat model for the selected provider.

    Connection/auth values (api_key, base_url, AWS credentials, region) are
    read from ``st.session_state['params']``; generation options such as
    ``temperature``, ``max_tokens`` and ``streaming`` arrive via ``kwargs``.

    Args:
        llm_provider: One of "OpenAI", "Antropic", "Bedrock", "Google", "Groq".
            ("Antropic" spelling intentionally matches the MODEL_OPTIONS key.)
        **kwargs: Optional generation parameters.

    Returns:
        A LangChain chat model instance for the chosen provider.

    Raises:
        ValueError: If ``llm_provider`` is not a supported name.
    """
    # Fall back to an empty dict so the .get() lookups below return None
    # instead of raising AttributeError when no params were stored yet.
    params = st.session_state.get('params') or {}
    if llm_provider == "OpenAI":
        return ChatOpenAI(
            base_url=params.get("base_url"),
            openai_api_key=params.get("api_key"),
            model=MODEL_OPTIONS['OpenAI'],
            temperature=kwargs.get('temperature', 0.7),
            # Honor streaming requested by get_response_stream(); previously
            # this kwarg was silently dropped for OpenAI.
            streaming=kwargs.get('streaming', False),
        )
    elif llm_provider == "Antropic":
        return ChatAnthropic(
            base_url=params.get("base_url"),
            anthropic_api_key=params.get("api_key"),
            model=MODEL_OPTIONS['Antropic'],
            temperature=kwargs.get('temperature', 0.7),
            # Same streaming fix as the OpenAI branch.
            streaming=kwargs.get('streaming', False),
        )
    elif llm_provider == "Bedrock":
        # boto3 is imported lazily so other providers work without it installed.
        import boto3
        # Initialize Bedrock runtime client from stored AWS credentials.
        _bedrock = boto3.client(
            'bedrock-runtime',
            region_name=params.get("region_name"),
            aws_access_key_id=params.get("aws_access_key"),
            aws_secret_access_key=params.get("aws_secret_key"),
        )
        return ChatBedrock(
            client=_bedrock,
            model_id=MODEL_OPTIONS['Bedrock'],
            **kwargs
        )
    elif llm_provider == "Google":
        return ChatGoogleGenerativeAI(
            google_api_key=params.get("api_key"),
            model=MODEL_OPTIONS['Google'],
            temperature=kwargs.get('temperature', 0.7),
            max_tokens=kwargs.get('max_tokens', 4096),
            max_retries=2,
        )
    elif llm_provider == "Groq":
        return ChatGroq(
            api_key=params.get("api_key"),  # ChatGroq aliases this to groq_api_key
            model=MODEL_OPTIONS['Groq'],
            temperature=kwargs.get("temperature", 0.7),
            streaming=kwargs.get("streaming", False)
        )
    else:
        raise ValueError(f"Unsupported LLM provider: {llm_provider}")
def get_response(prompt: str, llm_provider: str):
    """Invoke the selected LLM once and return its text reply.

    Failures are not raised: any exception is converted into an error
    string so callers can render it directly in the UI.
    """
    try:
        # Build the model for the chosen provider and send a single
        # human message through the standard LangChain interface.
        model = create_llm_model(llm_provider)
        result = model.invoke([HumanMessage(content=prompt)])
        return result.content
    except Exception as exc:
        return f"Error during LLM invocation: {str(exc)}"
def get_response_stream(
    prompt: str,
    llm_provider: str,
    system: Optional[str] = '',
    temperature: float = 1.0,
    max_tokens: int = 4096,
    **kwargs,
):
    """
    Get a streaming response from the selected LLM provider.

    Generation options (temperature, max_tokens, streaming) are merged into
    the provider kwargs; provider-specific connection/auth is handled by
    create_llm_model. On failure, the error is shown via Streamlit and the
    script run is stopped.
    """
    try:
        # Merge the explicit generation parameters with caller kwargs and
        # force streaming on.
        generation_opts = dict(kwargs)
        generation_opts["temperature"] = temperature
        generation_opts["max_tokens"] = max_tokens
        generation_opts["streaming"] = True
        model = create_llm_model(llm_provider, **generation_opts)
        # Optional system message first, then the user prompt.
        conversation = [SystemMessage(content=system)] if system else []
        conversation.append(HumanMessage(content=prompt))
        return model.stream(conversation)
    except Exception as exc:
        st.error(f"[Error during streaming: {str(exc)}]")
        st.stop()
def test_llm_connection(llm_provider: str, test_params: Optional[dict] = None):
    """
    Test the connection to the specified LLM provider.

    If ``test_params`` is given, it temporarily replaces
    ``st.session_state['params']`` for the duration of the test; the
    original value is restored in a ``finally`` block so it cannot be
    left clobbered by an exception (the previous version duplicated the
    restore in both the success and error paths).

    Returns a tuple of (success: bool, message: str).
    """
    original_params = None
    if test_params:
        # Temporarily swap in the test credentials.
        original_params = st.session_state.get('params', {})
        st.session_state['params'] = test_params
    try:
        llm = create_llm_model(llm_provider)
        # A minimal round-trip proves auth + connectivity.
        test_message = HumanMessage(content="Hello, this is a connection test. Please respond with 'OK'.")
        response = llm.invoke([test_message])
        return True, f"✅ Connection successful! Model response: {response.content[:100]}..."
    except Exception as e:
        return False, f"❌ Connection failed: {str(e)}"
    finally:
        # Always restore the original params if we swapped them out.
        if test_params:
            st.session_state['params'] = original_params