Spaces:

winbeau
/

paper-insight-api

Sleeping

App Files Files Community

paper-insight-api / app /services /dify_client.py

winbeau

Backend snapshot from 760fa78

353b9f4 about 1 month ago

raw

history blame contribute delete

11.5 kB

	"""
	Dify Workflow API Client with Streaming Support.

	This module replaces the DeepSeek direct API calls with Dify Chatflow API,
	supporting streaming responses for long-running R1 reasoning processes.
	"""

	import os
	import json
	import httpx
	from typing import Optional, AsyncGenerator, Dict, Any
	from dataclasses import dataclass
	from dotenv import load_dotenv

	from app.models import LLMAnalysis

	load_dotenv()


	@dataclass
	class DifyStreamEvent:
	"""Represents a single event from Dify's streaming response."""
	event: str
	data: Dict[str, Any]
	thought: Optional[str] = None
	answer: Optional[str] = None
	outputs: Optional[Dict[str, Any]] = None


	@dataclass
	class TechnicalMapping:
	"""Technical mapping analysis from Dify workflow."""
	token_vs_patch: str = ""
	temporal_logic: str = ""
	frequency_domain: str = ""


	@dataclass
	class DifyAnalysisResult:
	"""Complete analysis result from Dify workflow."""
	summary_zh: str
	relevance_score: float
	relevance_reason: str
	technical_mapping: TechnicalMapping
	heuristic_idea: str
	thought_process: Optional[str] = None # R1 thinking process


	class DifyClientError(Exception):
	"""Base exception for Dify client errors."""
	pass


	class DifyEntityTooLargeError(DifyClientError):
	"""Raised when request payload exceeds Dify's limit (413)."""
	pass


	class DifyTimeoutError(DifyClientError):
	"""Raised when request times out."""
	pass


	class DifyRateLimitError(DifyClientError):
	"""Raised when rate limit is exceeded (429)."""
	pass


	class DifyClient:
	"""Dify Chatflow API client with streaming support."""

	def __init__(self):
	self.api_key = os.getenv("DIFY_API_KEY")
	if not self.api_key:
	raise ValueError("DIFY_API_KEY environment variable is not set")

	self.base_url = os.getenv("DIFY_API_BASE", "http://82.157.209.193:8080/v1")
	self.endpoint = f"{self.base_url}/chat-messages"
	self.timeout = httpx.Timeout(120.0, connect=10.0) # 2 min for R1 reasoning

	def _format_query(
	self,
	topic: str,
	background: str,
	method: str,
	contribution: str,
	) -> str:
	"""Format input according to Dify workflow variable specification."""
	return f"""研究主题：{topic}
	技术背景：{background}
	核心方法：{method}
	预期贡献：{contribution}"""

	def _build_request_body(
	self,
	query: str,
	user_id: str = "paper-insight-user",
	conversation_id: Optional[str] = None,
	) -> Dict[str, Any]:
	"""Build the request body for Dify API."""
	body = {
	"inputs": {
	"query": query,
	},
	"query": query, # Also send as direct query for compatibility
	"response_mode": "streaming",
	"user": user_id,
	}

	if conversation_id:
	body["conversation_id"] = conversation_id

	return body

	def _get_headers(self) -> Dict[str, str]:
	"""Get request headers with authentication."""
	return {
	"Authorization": f"Bearer {self.api_key}",
	"Content-Type": "application/json",
	}

	async def analyze_paper_stream(
	self,
	title: str,
	abstract: str,
	user_id: str = "paper-insight-user",
	) -> AsyncGenerator[DifyStreamEvent, None]:
	"""
	Analyze a paper using Dify workflow with streaming.

	Yields DifyStreamEvent objects for each SSE event received.
	"""
	# Format the query using paper information
	query = self._format_query(
	topic=title,
	background="arXiv论文，需要分析其与DiT/KV Cache研究的相关性",
	method=abstract[:500] if len(abstract) > 500 else abstract,
	contribution="待分析",
	)

	body = self._build_request_body(query, user_id)
	headers = self._get_headers()

	async with httpx.AsyncClient(timeout=self.timeout) as client:
	try:
	async with client.stream(
	"POST",
	self.endpoint,
	json=body,
	headers=headers,
	) as response:
	# Handle error responses
	if response.status_code == 413:
	raise DifyEntityTooLargeError(
	"Request payload too large. Consider shortening the abstract."
	)
	elif response.status_code == 429:
	raise DifyRateLimitError(
	"Rate limit exceeded. Please try again later."
	)
	elif response.status_code >= 400:
	error_text = await response.aread()
	raise DifyClientError(
	f"Dify API error {response.status_code}: {error_text.decode()}"
	)

	# Parse SSE stream
	buffer = ""
	async for chunk in response.aiter_text():
	buffer += chunk
	# Process complete SSE events
	while "\n\n" in buffer:
	event_str, buffer = buffer.split("\n\n", 1)
	event = self._parse_sse_event(event_str)
	if event:
	yield event

	except httpx.TimeoutException as e:
	raise DifyTimeoutError(f"Request timed out: {e}")
	except httpx.RequestError as e:
	raise DifyClientError(f"Request failed: {e}")

	def _parse_sse_event(self, event_str: str) -> Optional[DifyStreamEvent]:
	"""Parse a single SSE event string into DifyStreamEvent."""
	lines = event_str.strip().split("\n")
	event_type = ""
	data_str = ""

	for line in lines:
	if line.startswith("event:"):
	event_type = line[6:].strip()
	elif line.startswith("data:"):
	data_str = line[5:].strip()

	if not data_str:
	return None

	try:
	data = json.loads(data_str)
	except json.JSONDecodeError:
	return None

	event = DifyStreamEvent(
	event=event_type or data.get("event", ""),
	data=data,
	)

	# Extract common fields
	if "thought" in data:
	event.thought = data["thought"]
	if "answer" in data:
	event.answer = data["answer"]
	if "outputs" in data:
	event.outputs = data["outputs"]

	return event

	async def analyze_paper(
	self,
	title: str,
	abstract: str,
	user_id: str = "paper-insight-user",
	) -> Optional[DifyAnalysisResult]:
	"""
	Analyze a paper and return the complete result.

	This method consumes the entire stream and returns the final result.
	Use analyze_paper_stream() for real-time streaming updates.
	"""
	thought_parts = []
	answer_parts = []
	final_outputs = None

	try:
	async for event in self.analyze_paper_stream(title, abstract, user_id):
	if event.thought:
	thought_parts.append(event.thought)
	if event.answer:
	answer_parts.append(event.answer)
	if event.outputs:
	final_outputs = event.outputs

	# Check for workflow completion
	if event.event == "workflow_finished" and event.outputs:
	final_outputs = event.outputs

	# Parse the final outputs
	if final_outputs:
	return self._parse_outputs(final_outputs, "".join(thought_parts))

	# Try to parse from answer if outputs not available
	full_answer = "".join(answer_parts)
	if full_answer:
	return self._parse_answer(full_answer, "".join(thought_parts))

	return None

	except DifyClientError as e:
	print(f"Dify analysis error: {e}")
	return None

	def _parse_outputs(
	self,
	outputs: Dict[str, Any],
	thought_process: str = "",
	) -> DifyAnalysisResult:
	"""Parse Dify workflow outputs into DifyAnalysisResult."""
	technical_mapping = TechnicalMapping()
	if "technical_mapping" in outputs:
	tm = outputs["technical_mapping"]
	if isinstance(tm, dict):
	technical_mapping = TechnicalMapping(
	token_vs_patch=tm.get("token_vs_patch", ""),
	temporal_logic=tm.get("temporal_logic", ""),
	frequency_domain=tm.get("frequency_domain", ""),
	)

	return DifyAnalysisResult(
	summary_zh=outputs.get("summary_zh", ""),
	relevance_score=float(outputs.get("relevance_score", 0)),
	relevance_reason=outputs.get("relevance_reason", ""),
	technical_mapping=technical_mapping,
	heuristic_idea=outputs.get("heuristic_idea", ""),
	thought_process=thought_process if thought_process else None,
	)

	def _parse_answer(
	self,
	answer: str,
	thought_process: str = "",
	) -> Optional[DifyAnalysisResult]:
	"""Parse answer string (JSON) into DifyAnalysisResult."""
	try:
	data = json.loads(answer)
	return self._parse_outputs(data, thought_process)
	except json.JSONDecodeError:
	# If not JSON, try to extract fields manually
	return DifyAnalysisResult(
	summary_zh=answer[:200] if answer else "",
	relevance_score=0,
	relevance_reason="无法解析结构化输出",
	technical_mapping=TechnicalMapping(),
	heuristic_idea="",
	thought_process=thought_process if thought_process else None,
	)

	def to_llm_analysis(self, result: DifyAnalysisResult) -> LLMAnalysis:
	"""Convert DifyAnalysisResult to legacy LLMAnalysis model."""
	# Combine technical mapping into heuristic_idea for backward compatibility
	tech_mapping_str = ""
	if result.technical_mapping:
	parts = []
	if result.technical_mapping.token_vs_patch:
	parts.append(f"Token/Patch映射: {result.technical_mapping.token_vs_patch}")
	if result.technical_mapping.temporal_logic:
	parts.append(f"时序逻辑: {result.technical_mapping.temporal_logic}")
	if result.technical_mapping.frequency_domain:
	parts.append(f"频域分析: {result.technical_mapping.frequency_domain}")
	if parts:
	tech_mapping_str = "\n\n【技术映射】\n" + "\n".join(parts)

	heuristic_with_mapping = result.heuristic_idea + tech_mapping_str

	return LLMAnalysis(
	summary_zh=result.summary_zh,
	relevance_score=result.relevance_score,
	relevance_reason=result.relevance_reason,
	heuristic_idea=heuristic_with_mapping,
	)


	# Singleton instance
	_dify_client: Optional[DifyClient] = None


	def get_dify_client() -> DifyClient:
	"""Get or create DifyClient singleton."""
	global _dify_client
	if _dify_client is None:
	_dify_client = DifyClient()
	return _dify_client