Spaces:
Sleeping
Sleeping
| import json | |
| import requests | |
| from typing import Generator, Optional | |
| from .base import BaseModel | |
class AnthropicModel(BaseModel):
    """Anthropic (Claude) model client using the streaming Messages API.

    Supports plain-text and base64-PNG image analysis, an optional extended
    "thinking" budget, and a configurable API base URL / model identifier.
    Both public entry points are generators that yield status dicts with a
    ``status`` key in: ``started``, ``streaming``, ``thinking``,
    ``thinking_complete``, ``completed``, ``error``.
    """

    # Fallbacks used when the caller does not configure these explicitly.
    DEFAULT_API_BASE_URL = "https://api.anthropic.com/v1"
    DEFAULT_MODEL_IDENTIFIER = "claude-3-7-sonnet-20250219"
    DEFAULT_MAX_TOKENS = 8192
    # Flush partial buffers at sentence-ending punctuation to reduce UI flicker.
    _FLUSH_MARKS = ('.', '!', '?', '。', '!', '?', '\n')

    def __init__(self, api_key, temperature=0.7, system_prompt=None, language=None, api_base_url=None, model_identifier=None):
        """Initialize the model.

        Args:
            api_key: Anthropic API key (an accidental ``Bearer `` prefix is stripped
                at request time).
            temperature: Stored by the base class; note the request payload pins
                temperature to 1 (required when "thinking" is enabled).
            system_prompt: System prompt; defaults to get_default_system_prompt().
            language: Response language code, defaults to "en".
            api_base_url: API base URL, defaults to the official Anthropic endpoint.
            model_identifier: Model name, defaults to DEFAULT_MODEL_IDENTIFIER.
        """
        super().__init__(api_key, temperature, system_prompt or self.get_default_system_prompt(), language or "en")
        self.api_base_url = api_base_url or self.DEFAULT_API_BASE_URL
        self.model_identifier = model_identifier or self.DEFAULT_MODEL_IDENTIFIER
        # Reasoning ("thinking") configuration dict; may be assigned later by callers.
        # Recognized keys (from usage below): 'reasoning_depth', 'think_budget', 'speed_mode'.
        self.reasoning_config = None
        # Maximum output tokens; falsy means "use DEFAULT_MAX_TOKENS".
        self.max_tokens = None

    def get_default_system_prompt(self) -> str:
        """Return the default system prompt used when none is supplied."""
        return """You are an expert at analyzing questions and providing detailed solutions. When presented with an image of a question:
1. First read and understand the question carefully
2. Break down the key components of the question
3. Provide a clear, step-by-step solution
4. If relevant, explain any concepts or theories involved
5. If there are multiple approaches, explain the most efficient one first"""

    def get_model_identifier(self) -> str:
        """Return the currently configured model identifier."""
        return self.model_identifier

    def _request_headers(self) -> dict:
        """Build request headers; strips an accidental 'Bearer ' prefix from the key."""
        api_key = self.api_key
        if api_key.startswith('Bearer '):
            api_key = api_key[len('Bearer '):]
        return {
            'x-api-key': api_key,
            'anthropic-version': '2023-06-01',
            'content-type': 'application/json',
            'accept': 'application/json',
        }

    def _resolve_max_tokens(self) -> int:
        """Return the configured max output tokens, or the default when unset."""
        return self.max_tokens if getattr(self, 'max_tokens', None) else self.DEFAULT_MAX_TOKENS

    def _apply_reasoning_config(self, payload: dict, max_tokens: int) -> None:
        """Attach (or omit) the 'thinking' block on *payload* per reasoning_config.

        Rules:
            - reasoning_depth == 'extended': use 'think_budget' (default max_tokens // 2)
            - speed_mode == 'instant': no thinking block at all
            - anything else (including no config): thinking enabled with a small
              budget of min(4096, max_tokens // 4)
        """
        config = getattr(self, 'reasoning_config', None)
        small_budget = {'type': 'enabled', 'budget_tokens': min(4096, max_tokens // 4)}
        if not config:
            payload['thinking'] = small_budget
        elif config.get('reasoning_depth') == 'extended':
            payload['thinking'] = {
                'type': 'enabled',
                'budget_tokens': config.get('think_budget', max_tokens // 2),
            }
        elif config.get('speed_mode') == 'instant':
            # Instant mode: thinking must be absent from the payload.
            payload.pop('thinking', None)
        else:
            payload['thinking'] = small_budget

    def _build_payload(self, content: list) -> dict:
        """Build the Messages API request payload for a single user turn."""
        max_tokens = self._resolve_max_tokens()
        payload = {
            'model': self.get_model_identifier(),
            'stream': True,
            'max_tokens': max_tokens,
            # Anthropic requires temperature == 1 when thinking is enabled.
            'temperature': 1,
            'system': self.system_prompt,
            'messages': [{
                'role': 'user',
                'content': content,
            }],
        }
        self._apply_reasoning_config(payload, max_tokens)
        return payload

    def _stream_events(self, payload: dict, proxies: Optional[dict]) -> Generator[dict, None, None]:
        """POST *payload* to /messages and yield status dicts as SSE chunks arrive.

        Yields ``streaming``/``thinking`` dicts with the accumulated content so far
        (buffered to sentence/size boundaries to reduce UI churn), then
        ``thinking_complete`` (if any thinking was produced) and ``completed`` on
        ``message_stop``. Yields an ``error`` dict and stops on HTTP or API errors.
        """
        response = requests.post(
            f"{self.api_base_url}/messages",
            headers=self._request_headers(),
            json=payload,
            stream=True,
            proxies=proxies,
            timeout=60,
        )
        if response.status_code != 200:
            error_msg = f'API error: {response.status_code}'
            try:
                error_data = response.json()
                if 'error' in error_data:
                    error_msg += f" - {error_data['error']['message']}"
            except Exception:
                # Body was not JSON; fall back to the raw text.
                error_msg += f" - {response.text}"
            yield {"status": "error", "error": error_msg}
            return

        thinking_content = ""
        response_buffer = ""
        for chunk in response.iter_lines():
            if not chunk:
                continue
            try:
                line = chunk.decode('utf-8')
                if not line.startswith('data: '):
                    continue
                data = json.loads(line[len('data: '):])
                event_type = data.get('type')
                if event_type == 'content_block_delta':
                    delta = data.get('delta', {})
                    if 'text' in delta:
                        text_chunk = delta['text']
                        response_buffer += text_chunk
                        # Only emit once enough accumulated, or at a sentence end.
                        if len(text_chunk) >= 10 or text_chunk.endswith(self._FLUSH_MARKS):
                            yield {"status": "streaming", "content": response_buffer}
                    elif 'thinking' in delta:
                        thinking_chunk = delta['thinking']
                        thinking_content += thinking_chunk
                        if len(thinking_chunk) >= 20 or thinking_chunk.endswith(self._FLUSH_MARKS):
                            yield {"status": "thinking", "content": thinking_content}
                elif event_type == 'extended_thinking_delta':
                    # Newer extended-thinking event shape: text lives under delta.text.
                    delta = data.get('delta', {})
                    if 'text' in delta:
                        thinking_chunk = delta['text']
                        thinking_content += thinking_chunk
                        if len(thinking_chunk) >= 20 or thinking_chunk.endswith(self._FLUSH_MARKS):
                            yield {"status": "thinking", "content": thinking_content}
                elif event_type == 'message_stop':
                    # Flush the complete thinking and response buffers.
                    if thinking_content:
                        yield {"status": "thinking_complete", "content": thinking_content}
                    yield {"status": "completed", "content": response_buffer}
                elif event_type == 'error':
                    yield {
                        "status": "error",
                        "error": data.get('error', {}).get('message', 'Unknown error'),
                    }
                    break
            except json.JSONDecodeError as e:
                # A malformed SSE line is skipped rather than aborting the stream.
                print(f"JSON decode error: {str(e)}")
                continue

    def analyze_text(self, text: str, proxies: Optional[dict] = None) -> Generator[dict, None, None]:
        """Stream Claude's response for text analysis.

        Args:
            text: The question/text to analyze.
            proxies: Optional requests-style proxies mapping.

        Yields:
            Status dicts (see class docstring). Any exception is converted into
            an ``error`` dict rather than raised out of the generator.
        """
        try:
            yield {"status": "started"}
            payload = self._build_payload([{'type': 'text', 'text': text}])
            print(f"Debug - 推理配置: max_tokens={payload['max_tokens']}, thinking={payload.get('thinking', payload.get('speed_mode', 'default'))}")
            yield from self._stream_events(payload, proxies)
        except Exception as e:
            yield {"status": "error", "error": f"Streaming error: {str(e)}"}

    def analyze_image(self, image_data, proxies: Optional[dict] = None) -> Generator[dict, None, None]:
        """Stream Claude's response for image analysis.

        Args:
            image_data: Base64-encoded PNG image payload.
            proxies: Optional requests-style proxies mapping.

        Yields:
            Status dicts (see class docstring). Unlike the original, request
            failures are caught and yielded as ``error`` dicts, matching the
            analyze_text contract.
        """
        try:
            yield {"status": "started"}
            payload = self._build_payload([
                {
                    'type': 'image',
                    'source': {
                        'type': 'base64',
                        'media_type': 'image/png',
                        'data': image_data,
                    },
                },
                {
                    'type': 'text',
                    'text': "请分析这个问题并提供详细的解决方案。如果你看到多个问题,请逐一解决。",
                },
            ])
            print(f"Debug - 图像分析推理配置: max_tokens={payload['max_tokens']}, thinking={payload.get('thinking', payload.get('speed_mode', 'default'))}")
            yield from self._stream_events(payload, proxies)
        except Exception as e:
            yield {"status": "error", "error": f"Error processing response: {str(e)}"}