Spaces:

torxytonnicker
/

teste

Sleeping

App Files Files Community

teste / src /ai /voting_system.py

torxyton

feat: Implementa sistema ensemble avançado de IA com múltiplos modelos

215b833 6 months ago

raw

history blame contribute delete

23.8 kB

	#!/usr/bin/env python3
	# -- coding: utf-8 --
	"""
	Sistema de Votação Inteligente para Ensemble AI
	Otimiza decisões através de algoritmos avançados de consenso
	"""

	import numpy as np
	import logging
	from typing import Dict, List, Optional, Tuple, Any
	from dataclasses import dataclass
	from enum import Enum
	from datetime import datetime, timedelta
	import json
	from collections import defaultdict, deque
	import statistics

	class VotingStrategy(Enum):
	"""Estratégias de votação disponíveis"""
	SIMPLE_MAJORITY = "simple_majority"
	WEIGHTED_AVERAGE = "weighted_average"
	CONFIDENCE_WEIGHTED = "confidence_weighted"
	DYNAMIC_CONSENSUS = "dynamic_consensus"
	BAYESIAN_FUSION = "bayesian_fusion"
	ADAPTIVE_ENSEMBLE = "adaptive_ensemble"

	@dataclass
	class VoteResult:
	"""Resultado de uma votação"""
	decision: str
	confidence: float
	consensus_strength: float
	strategy_used: VotingStrategy
	individual_votes: List[Dict[str, Any]]
	metadata: Dict[str, Any]
	processing_time: float

	@dataclass
	class ModelPerformance:
	"""Métricas de performance de um modelo"""
	accuracy_history: deque
	recent_accuracy: float
	long_term_accuracy: float
	consistency_score: float
	response_time_avg: float
	last_updated: datetime

	class AdaptiveWeightCalculator:
	"""Calculadora de pesos adaptativos para modelos"""

	def __init__(self, window_size: int = 100):
	self.window_size = window_size
	self.performance_tracker = defaultdict(lambda: ModelPerformance(
	accuracy_history=deque(maxlen=window_size),
	recent_accuracy=0.5,
	long_term_accuracy=0.5,
	consistency_score=0.5,
	response_time_avg=1.0,
	last_updated=datetime.now()
	))
	self.market_conditions = {
	'volatility': 0.5,
	'trend_strength': 0.5,
	'volume_profile': 0.5
	}

	def update_performance(self, model_name: str, accuracy: float, response_time: float):
	"""Atualiza métricas de performance de um modelo"""
	perf = self.performance_tracker[model_name]

	# Adicionar nova accuracy
	perf.accuracy_history.append(accuracy)

	# Calcular métricas
	if len(perf.accuracy_history) >= 10:
	perf.recent_accuracy = np.mean(list(perf.accuracy_history)[-10:])
	else:
	perf.recent_accuracy = np.mean(list(perf.accuracy_history))

	perf.long_term_accuracy = np.mean(list(perf.accuracy_history))

	# Calcular consistência (inverso do desvio padrão)
	if len(perf.accuracy_history) >= 5:
	std_dev = np.std(list(perf.accuracy_history))
	perf.consistency_score = max(0.1, 1.0 - std_dev)

	# Atualizar tempo de resposta médio
	alpha = 0.1
	perf.response_time_avg = alpha * response_time + (1 - alpha) * perf.response_time_avg

	perf.last_updated = datetime.now()

	def calculate_adaptive_weights(self, model_names: List[str],
	market_context: Optional[Dict[str, float]] = None) -> Dict[str, float]:
	"""Calcula pesos adaptativos baseados em performance e contexto"""
	weights = {}

	# Atualizar condições de mercado se fornecidas
	if market_context:
	self.market_conditions.update(market_context)

	for model_name in model_names:
	perf = self.performance_tracker[model_name]

	# Peso base da accuracy recente
	accuracy_weight = perf.recent_accuracy

	# Ajuste por consistência
	consistency_factor = perf.consistency_score

	# Ajuste por tempo de resposta (modelos mais rápidos têm vantagem)
	speed_factor = min(2.0, 2.0 / max(0.1, perf.response_time_avg))

	# Ajuste por condições de mercado
	market_factor = self._calculate_market_adjustment(model_name)

	# Peso final
	final_weight = accuracy_weight * consistency_factor * speed_factor * market_factor
	weights[model_name] = max(0.1, min(2.0, final_weight)) # Limitar entre 0.1 e 2.0

	# Normalizar pesos
	total_weight = sum(weights.values())
	if total_weight > 0:
	weights = {k: v / total_weight for k, v in weights.items()}

	return weights

	def _calculate_market_adjustment(self, model_name: str) -> float:
	"""Calcula ajuste baseado nas condições de mercado"""
	# Diferentes modelos podem ter performance melhor em diferentes condições
	model_preferences = {
	'FinBERT': {
	'high_volatility': 1.2,
	'strong_trend': 1.1,
	'high_volume': 1.0
	},
	'DistilBERT-Financial': {
	'high_volatility': 1.0,
	'strong_trend': 1.2,
	'high_volume': 1.1
	},
	'RoBERTa-Sentiment': {
	'high_volatility': 0.9,
	'strong_trend': 1.0,
	'high_volume': 1.2
	},
	'BERT-Base': {
	'high_volatility': 1.0,
	'strong_trend': 1.0,
	'high_volume': 1.0
	}
	}

	preferences = model_preferences.get(model_name, {
	'high_volatility': 1.0,
	'strong_trend': 1.0,
	'high_volume': 1.0
	})

	# Calcular fator de ajuste
	volatility_factor = preferences['high_volatility'] if self.market_conditions['volatility'] > 0.7 else 1.0
	trend_factor = preferences['strong_trend'] if self.market_conditions['trend_strength'] > 0.7 else 1.0
	volume_factor = preferences['high_volume'] if self.market_conditions['volume_profile'] > 0.7 else 1.0

	return (volatility_factor + trend_factor + volume_factor) / 3.0

	class IntelligentVotingSystem:
	"""Sistema de votação inteligente com múltiplas estratégias"""

	def __init__(self):
	self.weight_calculator = AdaptiveWeightCalculator()
	self.voting_history = deque(maxlen=1000)
	self.strategy_performance = defaultdict(lambda: deque(maxlen=100))
	self.logger = logging.getLogger(__name__)

	# Configurações de estratégias
	self.strategy_configs = {
	VotingStrategy.SIMPLE_MAJORITY: {'threshold': 0.5},
	VotingStrategy.WEIGHTED_AVERAGE: {'min_confidence': 0.3},
	VotingStrategy.CONFIDENCE_WEIGHTED: {'confidence_power': 2.0},
	VotingStrategy.DYNAMIC_CONSENSUS: {'consensus_threshold': 0.7},
	VotingStrategy.BAYESIAN_FUSION: {'prior_strength': 0.1},
	VotingStrategy.ADAPTIVE_ENSEMBLE: {'adaptation_rate': 0.1}
	}

	def vote(self, predictions: List[Dict[str, Any]],
	strategy: VotingStrategy = VotingStrategy.ADAPTIVE_ENSEMBLE,
	market_context: Optional[Dict[str, float]] = None) -> VoteResult:
	"""Executa votação usando estratégia especificada"""
	start_time = datetime.now()

	if not predictions:
	return self._empty_vote_result(strategy, start_time)

	# Selecionar estratégia automaticamente se for ADAPTIVE_ENSEMBLE
	if strategy == VotingStrategy.ADAPTIVE_ENSEMBLE:
	strategy = self._select_best_strategy(predictions, market_context)

	# Executar votação
	result = self._execute_voting_strategy(predictions, strategy, market_context)

	# Calcular tempo de processamento
	processing_time = (datetime.now() - start_time).total_seconds()
	result.processing_time = processing_time

	# Armazenar no histórico
	self.voting_history.append({
	'timestamp': datetime.now(),
	'strategy': strategy,
	'result': result,
	'num_predictions': len(predictions)
	})

	return result

	def _select_best_strategy(self, predictions: List[Dict[str, Any]],
	market_context: Optional[Dict[str, float]]) -> VotingStrategy:
	"""Seleciona a melhor estratégia baseada no contexto"""
	# Analisar características das predições
	confidences = [p.get('confidence', 0.5) for p in predictions]
	avg_confidence = np.mean(confidences)
	confidence_variance = np.var(confidences)

	# Analisar consenso
	predictions_count = defaultdict(int)
	for p in predictions:
	predictions_count[p.get('prediction', 'NEUTRO')] += 1

	max_agreement = max(predictions_count.values()) / len(predictions)

	# Selecionar estratégia baseada nas características
	if max_agreement > 0.8: # Alto consenso
	return VotingStrategy.SIMPLE_MAJORITY
	elif avg_confidence > 0.8: # Alta confiança
	return VotingStrategy.CONFIDENCE_WEIGHTED
	elif confidence_variance > 0.1: # Alta variância na confiança
	return VotingStrategy.WEIGHTED_AVERAGE
	elif len(predictions) >= 4: # Muitos modelos
	return VotingStrategy.BAYESIAN_FUSION
	else:
	return VotingStrategy.DYNAMIC_CONSENSUS

	def _execute_voting_strategy(self, predictions: List[Dict[str, Any]],
	strategy: VotingStrategy,
	market_context: Optional[Dict[str, float]]) -> VoteResult:
	"""Executa a estratégia de votação especificada"""

	if strategy == VotingStrategy.SIMPLE_MAJORITY:
	return self._simple_majority_vote(predictions)
	elif strategy == VotingStrategy.WEIGHTED_AVERAGE:
	return self._weighted_average_vote(predictions, market_context)
	elif strategy == VotingStrategy.CONFIDENCE_WEIGHTED:
	return self._confidence_weighted_vote(predictions)
	elif strategy == VotingStrategy.DYNAMIC_CONSENSUS:
	return self._dynamic_consensus_vote(predictions)
	elif strategy == VotingStrategy.BAYESIAN_FUSION:
	return self._bayesian_fusion_vote(predictions)
	else:
	# Fallback para weighted average
	return self._weighted_average_vote(predictions, market_context)

	def _simple_majority_vote(self, predictions: List[Dict[str, Any]]) -> VoteResult:
	"""Votação por maioria simples"""
	vote_counts = defaultdict(int)

	for pred in predictions:
	vote_counts[pred.get('prediction', 'NEUTRO')] += 1

	# Encontrar vencedor
	winner = max(vote_counts.keys(), key=lambda k: vote_counts[k])
	max_votes = vote_counts[winner]

	# Calcular confiança e consenso
	confidence = max_votes / len(predictions)
	consensus_strength = confidence

	return VoteResult(
	decision=winner,
	confidence=confidence,
	consensus_strength=consensus_strength,
	strategy_used=VotingStrategy.SIMPLE_MAJORITY,
	individual_votes=[{'prediction': p.get('prediction'), 'confidence': p.get('confidence')} for p in predictions],
	metadata={'vote_counts': dict(vote_counts)},
	processing_time=0.0
	)

	def _weighted_average_vote(self, predictions: List[Dict[str, Any]],
	market_context: Optional[Dict[str, float]]) -> VoteResult:
	"""Votação por média ponderada"""
	model_names = [p.get('model_name', f'model_{i}') for i, p in enumerate(predictions)]
	weights = self.weight_calculator.calculate_adaptive_weights(model_names, market_context)

	# Calcular scores ponderados
	sentiment_scores = []
	total_weight = 0

	for i, pred in enumerate(predictions):
	model_name = model_names[i]
	weight = weights.get(model_name, 1.0)
	confidence = pred.get('confidence', 0.5)
	sentiment_score = pred.get('sentiment_score', 0.0)

	weighted_score = sentiment_score * weight * confidence
	sentiment_scores.append(weighted_score)
	total_weight += weight * confidence

	# Calcular resultado final
	if total_weight > 0:
	final_sentiment = sum(sentiment_scores) / total_weight
	else:
	final_sentiment = 0.0

	# Determinar decisão
	if final_sentiment > 0.1:
	decision = "POSITIVO"
	elif final_sentiment < -0.1:
	decision = "NEGATIVO"
	else:
	decision = "NEUTRO"

	# Calcular confiança média ponderada
	weighted_confidences = [p.get('confidence', 0.5) * weights.get(model_names[i], 1.0)
	for i, p in enumerate(predictions)]
	confidence = sum(weighted_confidences) / sum(weights.values()) if weights else 0.5

	# Calcular consenso
	consensus_strength = self._calculate_consensus_strength(predictions)

	return VoteResult(
	decision=decision,
	confidence=confidence,
	consensus_strength=consensus_strength,
	strategy_used=VotingStrategy.WEIGHTED_AVERAGE,
	individual_votes=[{'prediction': p.get('prediction'), 'confidence': p.get('confidence'),
	'weight': weights.get(model_names[i], 1.0)} for i, p in enumerate(predictions)],
	metadata={'final_sentiment': final_sentiment, 'weights': weights},
	processing_time=0.0
	)

	def _confidence_weighted_vote(self, predictions: List[Dict[str, Any]]) -> VoteResult:
	"""Votação ponderada pela confiança"""
	power = self.strategy_configs[VotingStrategy.CONFIDENCE_WEIGHTED]['confidence_power']

	# Calcular pesos baseados na confiança
	weighted_votes = defaultdict(float)
	total_weight = 0

	for pred in predictions:
	confidence = pred.get('confidence', 0.5)
	prediction = pred.get('prediction', 'NEUTRO')
	weight = confidence ** power

	weighted_votes[prediction] += weight
	total_weight += weight

	# Normalizar
	if total_weight > 0:
	weighted_votes = {k: v / total_weight for k, v in weighted_votes.items()}

	# Encontrar vencedor
	winner = max(weighted_votes.keys(), key=lambda k: weighted_votes[k])
	confidence = weighted_votes[winner]

	# Calcular consenso
	consensus_strength = confidence

	return VoteResult(
	decision=winner,
	confidence=confidence,
	consensus_strength=consensus_strength,
	strategy_used=VotingStrategy.CONFIDENCE_WEIGHTED,
	individual_votes=[{'prediction': p.get('prediction'), 'confidence': p.get('confidence')} for p in predictions],
	metadata={'weighted_votes': dict(weighted_votes)},
	processing_time=0.0
	)

	def _dynamic_consensus_vote(self, predictions: List[Dict[str, Any]]) -> VoteResult:
	"""Votação por consenso dinâmico"""
	threshold = self.strategy_configs[VotingStrategy.DYNAMIC_CONSENSUS]['consensus_threshold']

	# Agrupar por predição
	groups = defaultdict(list)
	for pred in predictions:
	groups[pred.get('prediction', 'NEUTRO')].append(pred)

	# Encontrar grupo com maior consenso
	best_group = None
	best_consensus = 0

	for prediction, group in groups.items():
	# Calcular consenso do grupo
	confidences = [p.get('confidence', 0.5) for p in group]
	group_size_factor = len(group) / len(predictions)
	avg_confidence = np.mean(confidences)
	consensus = group_size_factor * avg_confidence

	if consensus > best_consensus:
	best_consensus = consensus
	best_group = (prediction, group)

	if best_group and best_consensus >= threshold:
	decision = best_group[0]
	confidence = best_consensus
	else:
	# Fallback para neutro se não há consenso suficiente
	decision = "NEUTRO"
	confidence = 0.5

	return VoteResult(
	decision=decision,
	confidence=confidence,
	consensus_strength=best_consensus,
	strategy_used=VotingStrategy.DYNAMIC_CONSENSUS,
	individual_votes=[{'prediction': p.get('prediction'), 'confidence': p.get('confidence')} for p in predictions],
	metadata={'threshold': threshold, 'groups': {k: len(v) for k, v in groups.items()}},
	processing_time=0.0
	)

	def _bayesian_fusion_vote(self, predictions: List[Dict[str, Any]]) -> VoteResult:
	"""Votação usando fusão Bayesiana"""
	prior_strength = self.strategy_configs[VotingStrategy.BAYESIAN_FUSION]['prior_strength']

	# Prior uniforme
	classes = ['POSITIVO', 'NEUTRO', 'NEGATIVO']
	prior = {cls: 1.0/len(classes) for cls in classes}

	# Calcular likelihood para cada classe
	posteriors = prior.copy()

	for pred in predictions:
	prediction = pred.get('prediction', 'NEUTRO')
	confidence = pred.get('confidence', 0.5)

	# Atualizar posterior
	for cls in classes:
	if cls == prediction:
	likelihood = confidence
	else:
	likelihood = (1 - confidence) / (len(classes) - 1)

	posteriors[cls] = (prior_strength prior[cls] + likelihood)

	# Normalizar
	total = sum(posteriors.values())
	if total > 0:
	posteriors = {k: v / total for k, v in posteriors.items()}

	# Encontrar classe com maior probabilidade
	winner = max(posteriors.keys(), key=lambda k: posteriors[k])
	confidence = posteriors[winner]

	# Calcular consenso baseado na distribuição
	entropy = -sum(p * np.log(p + 1e-10) for p in posteriors.values())
	max_entropy = np.log(len(classes))
	consensus_strength = 1 - (entropy / max_entropy)

	return VoteResult(
	decision=winner,
	confidence=confidence,
	consensus_strength=consensus_strength,
	strategy_used=VotingStrategy.BAYESIAN_FUSION,
	individual_votes=[{'prediction': p.get('prediction'), 'confidence': p.get('confidence')} for p in predictions],
	metadata={'posteriors': posteriors, 'entropy': entropy},
	processing_time=0.0
	)

	def _calculate_consensus_strength(self, predictions: List[Dict[str, Any]]) -> float:
	"""Calcula força do consenso entre predições"""
	if not predictions:
	return 0.0

	# Contar predições por classe
	counts = defaultdict(int)
	for pred in predictions:
	counts[pred.get('prediction', 'NEUTRO')] += 1

	# Calcular consenso
	max_count = max(counts.values())
	consensus = max_count / len(predictions)

	return consensus

	def _empty_vote_result(self, strategy: VotingStrategy, start_time: datetime) -> VoteResult:
	"""Resultado para quando não há predições"""
	return VoteResult(
	decision="NEUTRO",
	confidence=0.0,
	consensus_strength=0.0,
	strategy_used=strategy,
	individual_votes=[],
	metadata={'error': 'no_predictions'},
	processing_time=(datetime.now() - start_time).total_seconds()
	)

	def update_strategy_performance(self, strategy: VotingStrategy, accuracy: float):
	"""Atualiza performance de uma estratégia"""
	self.strategy_performance[strategy].append(accuracy)

	def get_best_strategy(self) -> VotingStrategy:
	"""Retorna a estratégia com melhor performance recente"""
	if not self.strategy_performance:
	return VotingStrategy.ADAPTIVE_ENSEMBLE

	best_strategy = VotingStrategy.ADAPTIVE_ENSEMBLE
	best_performance = 0.0

	for strategy, performances in self.strategy_performance.items():
	if len(performances) >= 5: # Mínimo de amostras
	avg_performance = np.mean(list(performances)[-10:]) # Últimas 10
	if avg_performance > best_performance:
	best_performance = avg_performance
	best_strategy = strategy

	return best_strategy

	def get_voting_stats(self) -> Dict[str, Any]:
	"""Retorna estatísticas do sistema de votação"""
	stats = {
	'total_votes': len(self.voting_history),
	'strategy_usage': defaultdict(int),
	'avg_processing_time': 0.0,
	'avg_consensus_strength': 0.0,
	'strategy_performance': {}
	}

	if self.voting_history:
	# Contar uso de estratégias
	for vote in self.voting_history:
	stats['strategy_usage'][vote['strategy'].value] += 1

	# Calcular médias
	processing_times = [vote['result'].processing_time for vote in self.voting_history]
	consensus_strengths = [vote['result'].consensus_strength for vote in self.voting_history]

	stats['avg_processing_time'] = np.mean(processing_times)
	stats['avg_consensus_strength'] = np.mean(consensus_strengths)

	# Performance das estratégias
	for strategy, performances in self.strategy_performance.items():
	if performances:
	stats['strategy_performance'][strategy.value] = {
	'avg_accuracy': np.mean(list(performances)),
	'recent_accuracy': np.mean(list(performances)[-10:]) if len(performances) >= 10 else np.mean(list(performances)),
	'sample_count': len(performances)
	}

	return dict(stats)

	# Instância global do sistema de votação
	voting_system = IntelligentVotingSystem()

	# Função de conveniência
	def intelligent_vote(predictions: List[Dict[str, Any]],
	strategy: VotingStrategy = VotingStrategy.ADAPTIVE_ENSEMBLE,
	market_context: Optional[Dict[str, float]] = None) -> VoteResult:
	"""Função principal para votação inteligente"""
	return voting_system.vote(predictions, strategy, market_context)

	if __name__ == "__main__":
	# Teste do sistema
	test_predictions = [
	{'model_name': 'FinBERT', 'prediction': 'POSITIVO', 'confidence': 0.8, 'sentiment_score': 0.6},
	{'model_name': 'DistilBERT', 'prediction': 'POSITIVO', 'confidence': 0.7, 'sentiment_score': 0.4},
	{'model_name': 'RoBERTa', 'prediction': 'NEUTRO', 'confidence': 0.6, 'sentiment_score': 0.1},
	{'model_name': 'BERT', 'prediction': 'POSITIVO', 'confidence': 0.9, 'sentiment_score': 0.7}
	]

	print("Testando sistema de votação inteligente...")

	for strategy in VotingStrategy:
	result = intelligent_vote(test_predictions, strategy)
	print(f"\nEstratégia: {strategy.value}")
	print(f"Decisão: {result.decision}")
	print(f"Confiança: {result.confidence:.3f}")
	print(f"Consenso: {result.consensus_strength:.3f}")
	print(f"Tempo: {result.processing_time:.3f}s")