# fraud-detector-app / models.py
# commit cc8732a — "fix: update app file" (author: soupstick)
"""
Model routing and management for fraud detection
"""
import logging
from typing import Optional, Dict, Any
from huggingface_hub import InferenceClient
logger = logging.getLogger(__name__)
class ModelRouter:
    """Routes requests to appropriate models based on task type.

    One ``InferenceClient`` is created per configured task in ``__init__``.
    A task whose client could not be created (no token, init failure) is
    simply absent from ``self.clients``; ``run`` then returns a user-facing
    "not available" message instead of raising.
    """

    def __init__(self, hf_token: str):
        self.hf_token = hf_token
        # Updated model names - using more reliable models
        # Task name -> hosted model repo id.
        self.models: Dict[str, str] = {
            "analysis": "mistralai/Mistral-7B-Instruct-v0.2",  # More stable model
            "coding": "Qwen/Qwen2.5-Coder-32B-Instruct",
        }
        # Only tasks whose client initialized successfully appear here.
        self.clients: Dict[str, Any] = {}
        self._init_clients()

    def _init_clients(self) -> None:
        """Initialize one model client per task, skipping failures.

        Errors are logged rather than raised so one bad model cannot take
        down the whole router.
        """
        for task, model_name in self.models.items():
            try:
                if self.hf_token:
                    # 60s timeout so a hung endpoint surfaces as an error
                    # instead of blocking the request indefinitely.
                    self.clients[task] = InferenceClient(
                        model=model_name,
                        token=self.hf_token,
                        timeout=60,
                    )
                    logger.info(f"Initialized client for {task}: {model_name}")
                else:
                    logger.warning(f"No HF token provided, {task} model will not be available")
            except Exception as e:
                logger.error(f"Failed to initialize {task} client: {e}")

    @staticmethod
    def _extract_chat_text(response: Any) -> str:
        """Extract the assistant message text from a chat-completion response.

        Handles both object-style responses (``response.choices[0].message``)
        and plain-dict responses; falls back to ``str(response)``.
        """
        if hasattr(response, 'choices') and len(response.choices) > 0:
            return response.choices[0].message.content.strip()
        if isinstance(response, dict) and 'choices' in response:
            return response['choices'][0]['message']['content'].strip()
        return str(response).strip()

    @staticmethod
    def _extract_generated_text(response: Any) -> str:
        """Extract plain text from a text-generation response of any shape."""
        if isinstance(response, str):
            return response.strip()
        if hasattr(response, 'generated_text'):
            return response.generated_text.strip()
        return str(response).strip()

    def run(self, prompt: str, task: str = "analysis", max_tokens: int = 500) -> str:
        """Run inference with specified task model.

        Args:
            prompt: User prompt to send to the model.
            task: Key into ``self.models``/``self.clients`` ("analysis" or
                "coding").
            max_tokens: Generation budget for either API path.

        Returns:
            The model's reply text, or a human-readable fallback message —
            this method never raises.
        """
        if task not in self.clients:
            return f"Model for task '{task}' not available. Please check HF_TOKEN."
        try:
            client = self.clients[task]
            # Try chat completion first (preferred for instruction models).
            try:
                messages = [
                    {"role": "system", "content": "You are a helpful fraud detection analyst AI. Be concise, clear, and practical."},
                    {"role": "user", "content": prompt},
                ]
                response = client.chat_completion(
                    messages=messages,
                    max_tokens=max_tokens,
                    temperature=0.7,
                )
                return self._extract_chat_text(response)
            except Exception as chat_error:
                # Fallback to raw text generation for endpoints that do not
                # support the chat-completion API.
                logger.warning(f"Chat completion failed, trying text generation: {chat_error}")
                response = client.text_generation(
                    prompt,
                    max_new_tokens=max_tokens,
                    temperature=0.7,
                    do_sample=True,
                    return_full_text=False,
                )
                return self._extract_generated_text(response)
        except Exception as e:
            error_msg = f"Error running {task} model: {str(e)}"
            logger.error(error_msg)
            # Return a more helpful fallback message; the rule-based fraud
            # checks elsewhere in the app are unaffected by a model outage.
            return """
๐Ÿ” FRAUD ANALYSIS REPORT (Fallback Mode)
๐Ÿ“Š Analysis could not be completed with AI model, but fraud detection algorithms ran successfully.
โš ๏ธ Please check the flagged transactions below for manual review.
๐ŸŽฏ Recommended: Review all flagged transactions and consider implementing additional monitoring.
""".strip()

    def get_available_models(self) -> Dict[str, str]:
        """Get list of available models (tasks with a working client)."""
        return {task: model for task, model in self.models.items() if task in self.clients}

    def health_check(self) -> Dict[str, bool]:
        """Check if models are working.

        Returns a mapping of task name -> True/False based on whether a
        tiny test generation succeeds.
        """
        status = {}
        for task, client in self.clients.items():
            try:
                # Simple test prompt; the output itself is irrelevant.
                client.text_generation("Hello", max_new_tokens=10)
                status[task] = True
            except Exception as e:
                logger.error(f"Health check failed for {task}: {e}")
                status[task] = False
        return status