Spaces:

akra35567
/

akira

Running

App Files Files Community

akra35567 committed on Nov 7, 2025

Commit

c9bf6b7

1 Parent(s): f9c1f80

Update modules/api.py

Browse files

Files changed (1) hide show

modules/api.py +175 -68

modules/api.py CHANGED Viewed

@@ -1,18 +1,19 @@
 """
 API wrapper para o serviço Akira - VERSÃO FINAL RETIFICADA (11/2025)
-✅ Gemini seguro (respeita ausência de Part)
-✅ Mistral SDK compatível (novo/antigo)
-✅ Fallback global
-✅ Logs detalhados
 """
-from typing import Any
-import time
 import re
 import datetime
 import json
 from flask import Flask, Blueprint, request, jsonify
 from loguru import logger
 import modules.config as config
 from .contexto import Contexto
 from .database import Database
@@ -23,9 +24,9 @@ from .local_llm import LlamaLLM
 # ================================
 # CONFIGURAÇÃO DE PROVEDORES
 # ================================
 try:
     from mistralai import Mistral
     try:
         from mistralai.models.chat import ChatMessage
     except ImportError:
@@ -42,55 +43,70 @@ except ImportError:
     gemini_available = False
     logger.warning("⚠️ google-generativeai não instalado.")
 class LLMManager:
-    def __init__(self, config):
-        self.config = config
         self.llama = LlamaLLM()
         self.mistral_client = None
         self.gemini_model = None
         self._setup_providers()
     def _setup_providers(self):
-        if mistral_available and self.config.MISTRAL_API_KEY:
             try:
                 self.mistral_client = Mistral(api_key=self.config.MISTRAL_API_KEY)
                 logger.info("✅ Mistral API inicializada (principal)")
             except Exception as e:
                 logger.warning(f"⚠️ Falha ao inicializar Mistral: {e}")
                 self.mistral_client = None
-        if gemini_available and self.config.GEMINI_API_KEY:
             try:
                 genai.configure(api_key=self.config.GEMINI_API_KEY)
                 self.gemini_model = genai.GenerativeModel(self.config.GEMINI_MODEL)
-                logger.info("✅ Gemini inicializado (fallback)")
             except Exception as e:
                 logger.warning(f"⚠️ Falha ao inicializar Gemini: {e}")
                 self.gemini_model = None
     def _limpar_resposta(self, texto: str) -> str:
         if not texto:
             return ""
         texto = re.sub(r'[\*\_\`\[\]\"]', '', texto)
         texto = re.sub(r'\s+', ' ', texto.replace('\n', ' ')).strip()
         if len(texto) > 280:
             frases = [f.strip() for f in texto.split('. ') if f.strip()]
             curto = ""
             for f in frases:
-                if len(curto + f + ". ") <= 280:
-                    curto += f + ". "
                 else:
                     break
             texto = curto.strip()
             if not texto.endswith(('.', '!', '?')):
                 texto += "..."
         return texto.strip()
     def generate(self, prompt: str, max_tokens: int = 500, temperature: float = 0.8) -> str:
         max_attempts = 6
         for attempt in range(1, max_attempts + 1):
-            # Mistral
             if self.mistral_client:
                 try:
                     resp = self.mistral_client.chat.complete(
@@ -100,28 +116,33 @@ class LLMManager:
                         temperature=temperature,
                         top_p=self.config.TOP_P,
                     )
                     text = getattr(resp, "choices", None)
                     if text and len(text) > 0 and hasattr(text[0], "message"):
                         text_val = getattr(text[0].message, "content", None)
                         if text_val:
                             logger.info(f"✅ Mistral OK (tentativa {attempt})")
                             return self._limpar_resposta(text_val)
                 except Exception as e:
                     logger.warning(f"Mistral erro {attempt}: {e}")
-            # Llama local
-            if self.llama.model:
                 try:
                     resp = self.llama.generate(prompt, max_tokens)
-                    if resp.strip():
                         logger.info(f"✅ Llama OK (tentativa {attempt})")
                         return self._limpar_resposta(resp)
                 except Exception as e:
                     logger.warning(f"Llama erro {attempt}: {e}")
-            # Gemini
             if self.gemini_model:
                 try:
                     resp = self.gemini_model.generate_content(
                         prompt,
                         generation_config={
@@ -130,18 +151,39 @@ class LLMManager:
                             "top_p": self.config.TOP_P,
                         }
                     )
-                    # Acessa text de forma segura, mesmo sem 'Part'
-                    text = getattr(resp, "text", None)
                     if not text and hasattr(resp, "candidates") and len(resp.candidates) > 0:
-                        text = getattr(resp.candidates[0], "content", None)
                     if text and isinstance(text, str) and text.strip():
                         logger.info(f"✅ Gemini OK (tentativa {attempt})")
                         return self._limpar_resposta(text)
                 except Exception as e:
                     logger.warning(f"Gemini erro {attempt}: {e}")
                     if "429" in str(e) or "quota" in str(e):
                         time.sleep(2 ** (attempt % 3))
         logger.error("❌ Todos os provedores falharam. Retornando fallback.")
         return getattr(self.config, "FALLBACK_RESPONSE", "Desculpa, puto, não consegui responder.")
@@ -149,111 +191,176 @@ class LLMManager:
 # ================================
 # CLASSE PRINCIPAL AKIRA API
 # ================================
 class AkiraAPI:
     def __init__(self, cfg_module):
         self.config = cfg_module
         self.app = Flask(__name__)
         self.api = Blueprint("akira_api", __name__)
         self.db = Database(getattr(self.config, 'DB_PATH', '/app/data/akira.db'))
-        self.contexto_cache = {}
         self.providers = LLMManager(self.config)
         self.treinador = Treinamento(self.db)
         self.web_search = WebSearch()
         self._setup_routes()
         self.app.register_blueprint(self.api, url_prefix="/api")
         if getattr(self.config, 'START_PERIODIC_TRAINER', False):
             self.treinador.start_periodic_training()
     def _get_user_context(self, usuario: str, numero: str) -> Contexto:
         key = numero or usuario
         if key not in self.contexto_cache:
             ctx = Contexto(self.db, key)
             ctx.atualizar_aprendizados_do_banco()
             self.contexto_cache[key] = ctx
         return self.contexto_cache[key]
     def _get_pronomes_por_tom(self, tom: str) -> str:
-        result = self.db._execute_with_retry(
-            "SELECT pronomes FROM pronomes_por_tom WHERE tom=?", (tom.lower(),)
-        )
-        return result[0][0] if result else ""
-    def _build_prompt(self, usuario, numero, mensagem, emocao, contexto, is_privileged, is_reply, mensagem_original):
         data_hora = datetime.datetime.now().strftime("%d/%m/%Y %H:%M")
-        noticias = self.web_search.pesquisar_noticias_angola()
         tom_usuario = contexto.ton_predominante or "neutro"
         pronomes = self._get_pronomes_por_tom(tom_usuario)
         regras = f"""
 REGRAS:
-- Fale como pessoa real de Luanda
-- 1 a 2 frases
-- Pode usar gírias (bué, fixe, oroh, kota, puto)
-- Pode usar sarcasmo leve e risadas (kkk, rsrs)
-- Nada de markdown
-- Data atual: {data_hora}
 """
         hist = contexto.obter_historico()[-3:]
-        hist_txt = "\n".join([f"U: {h[0]}\nA: {h[1]}" for h in hist]) if hist else ""
-        user_info = f"Usuário: {usuario} ({numero})\nTom: {tom_usuario}\nEmoção: {emocao}"
         prompt = f"[SYSTEM]\n{regras}\n{self.config.SYSTEM_PROMPT}\n{self.config.PERSONA}\n[/SYSTEM]\n"
-        prompt += f"[CONTEXTO]\n{hist_txt}\n{user_info}\n[/CONTEXTO]\n[MENSAGEM]\n{mensagem}\n[/MENSAGEM]\nAkira:"
         return prompt
     def _setup_routes(self):
         @self.api.route('/akira', methods=['POST'])
         @self.api.route('/', methods=['POST'])
         def akira_endpoint():
             try:
                 raw_data = request.get_data(as_text=True)
                 logger.info(f"📩 RAW recebido ({len(raw_data)} bytes)")
                 try:
-                    if isinstance(request.json, dict):
-                        data = request.json
-                    else:
-                        data = json.loads(raw_data)
                 except Exception as e:
-                    logger.warning(f"⚠️ JSON inválido: {e}")
-                    data = {}
                 if not isinstance(data, dict):
                     data = {}
                 usuario = data.get('usuario', 'Anônimo')
-                numero = data.get('numero', '')
                 mensagem = data.get('mensagem', '')
                 is_privileged = (usuario.lower() == 'isaac' or '244937035662' in numero)
                 is_reply = bool(data.get('is_reply') or data.get('mensagem_original'))
                 mensagem_original = data.get('mensagem_original') or data.get('quoted_message') or ''
-                if not isinstance(mensagem, str) or not mensagem.strip():
-                    return jsonify({'error': 'mensagem obrigatória'}), 400
                 contexto = self._get_user_context(usuario, numero)
                 emocao = contexto.analisar_emocoes_mensagem(mensagem)
                 prompt = self._build_prompt(usuario, numero, mensagem, emocao, contexto, is_privileged, is_reply, mensagem_original)
                 resposta = self.providers.generate(prompt, max_tokens=500, temperature=0.8)
                 contexto.atualizar_contexto(mensagem, resposta)
                 self.treinador.registrar_interacao(usuario, mensagem, resposta, numero, is_reply, mensagem_original)
                 return jsonify({
                     'resposta': resposta,
                     'emocao': emocao,
                     'usuario': usuario,
                     'numero': numero
                 })
             except Exception as e:
-                logger.error(f"❌ Erro fatal: {e}", exc_info=True)
                 return jsonify({'resposta': 'deu um erro interno, puto 😅'}), 500
     def run(self, host='0.0.0.0', port=7860, debug=False):
         logger.info(f"🚀 Iniciando servidor Flask na porta {port}")
-        self.app.run(host=host, port=port, debug=debug, threaded=True)

 """
 API wrapper para o serviço Akira - VERSÃO FINAL RETIFICADA (11/2025)
+✅ Gemini configurado sem filtros (conforme solicitação)
+✅ Mistral SDK compatível
+✅ Fallback global e lógica de tentativas
+✅ Contexto, Treinamento e Rotas completas
 """
 import re
+import time
 import datetime
 import json
+from typing import Any, Optional, Dict
 from flask import Flask, Blueprint, request, jsonify
 from loguru import logger
+# Presume-se que esses módulos existem no seu ambiente:
 import modules.config as config
 from .contexto import Contexto
 from .database import Database
 # ================================
 # CONFIGURAÇÃO DE PROVEDORES
 # ================================
 try:
     from mistralai import Mistral
+    # Tenta importar ChatMessage dos caminhos possíveis (SDKs novos/antigos)
     try:
         from mistralai.models.chat import ChatMessage
     except ImportError:
     gemini_available = False
     logger.warning("⚠️ google-generativeai não instalado.")
 class LLMManager:
+    def __init__(self, cfg):
+        self.config = cfg
         self.llama = LlamaLLM()
         self.mistral_client = None
         self.gemini_model = None
         self._setup_providers()
     def _setup_providers(self):
         """Build the Mistral and Gemini clients when SDK and API key are present.

         A provider is attempted only if its availability flag is truthy and the
         matching ``*_API_KEY`` attribute exists on the config and is non-empty.
         If construction raises, the failure is logged as a warning and the
         corresponding attribute is reset to ``None``.
         """
         cfg = self.config

         # --- Mistral ---
         if mistral_available and getattr(cfg, "MISTRAL_API_KEY", None):
             try:
                 self.mistral_client = Mistral(api_key=cfg.MISTRAL_API_KEY)
                 logger.info("✅ Mistral API inicializada (principal)")
             except Exception as err:
                 logger.warning(f"⚠️ Falha ao inicializar Mistral: {err}")
                 self.mistral_client = None

         # --- Gemini ---
         if gemini_available and getattr(cfg, "GEMINI_API_KEY", None):
             try:
                 genai.configure(api_key=cfg.GEMINI_API_KEY)
                 # No safety_settings argument is passed to GenerativeModel.
                 # NOTE(review): the log line below says "sem filtro", but
                 # nothing in this method configures filtering; presumably the
                 # SDK's default safety behaviour still applies - confirm
                 # against the google-generativeai documentation.
                 self.gemini_model = genai.GenerativeModel(cfg.GEMINI_MODEL)
                 logger.info("✅ Gemini inicializado (fallback) - Configurado para ser sem filtro.")
             except Exception as err:
                 logger.warning(f"⚠️ Falha ao inicializar Gemini: {err}")
                 self.gemini_model = None
     def _limpar_resposta(self, texto: str) -> str:
+        """Remove formatação (markdown, etc.), espaços extras e limita a 280 caracteres."""
         if not texto:
             return ""
+        # Remove caracteres de formatação comuns (Markdown)
         texto = re.sub(r'[\*\_\`\[\]\"]', '', texto)
+        # Substitui quebras de linha por espaço e normaliza múltiplos espaços
         texto = re.sub(r'\s+', ' ', texto.replace('\n', ' ')).strip()
+        # Limitação a 280 caracteres, quebrando por frases
         if len(texto) > 280:
             frases = [f.strip() for f in texto.split('. ') if f.strip()]
             curto = ""
             for f in frases:
+                # Adiciona ". " de volta
+                frase_com_ponto = f + (". " if not f.endswith(('.', '!', '?')) else " ")
+                if len(curto + frase_com_ponto) <= 280:
+                    curto += frase_com_ponto
                 else:
                     break
             texto = curto.strip()
+            # Adiciona reticências se a truncagem ocorreu no meio de uma frase
             if not texto.endswith(('.', '!', '?')):
                 texto += "..."
         return texto.strip()
     def generate(self, prompt: str, max_tokens: int = 500, temperature: float = 0.8) -> str:
+        """Tenta gerar texto usando LLMs na ordem: Mistral → Llama → Gemini."""
         max_attempts = 6
         for attempt in range(1, max_attempts + 1):
+            # --- 1. Mistral ---
             if self.mistral_client:
                 try:
                     resp = self.mistral_client.chat.complete(
                         temperature=temperature,
                         top_p=self.config.TOP_P,
                     )
                     text = getattr(resp, "choices", None)
                     if text and len(text) > 0 and hasattr(text[0], "message"):
                         text_val = getattr(text[0].message, "content", None)
                         if text_val:
                             logger.info(f"✅ Mistral OK (tentativa {attempt})")
                             return self._limpar_resposta(text_val)
                 except Exception as e:
                     logger.warning(f"Mistral erro {attempt}: {e}")
+            # --- 2. Llama Local ---
+            if getattr(self.llama, "model", None):
                 try:
                     resp = self.llama.generate(prompt, max_tokens)
+                    if resp and resp.strip():
                         logger.info(f"✅ Llama OK (tentativa {attempt})")
                         return self._limpar_resposta(resp)
                 except Exception as e:
                     logger.warning(f"Llama erro {attempt}: {e}")
+            # --- 3. Gemini ---
             if self.gemini_model:
                 try:
+                    # CONFIGURAÇÃO: Para garantir "sem filtros", evitamos passar safety_settings
+                    # O SDK (google-generativeai) usará o comportamento default do modelo/API
+                    # que, em modelos mais recentes ou APIs configuradas, é menos restritivo.
                     resp = self.gemini_model.generate_content(
                         prompt,
                         generation_config={
                             "top_p": self.config.TOP_P,
                         }
                     )
+                    # Extração robusta do texto
+                    text: Optional[str] = getattr(resp, "text", None)
                     if not text and hasattr(resp, "candidates") and len(resp.candidates) > 0:
+                        candidate = resp.candidates[0]
+                        # Tenta extrair de 'content.parts' (estrutura mais completa)
+                        content = getattr(candidate, "content", None)
+                        if content and hasattr(content, "parts") and content.parts:
+                            for part in content.parts:
+                                part_text = getattr(part, "text", None)
+                                if part_text:
+                                    text = part_text
+                                    break
+                        # Tenta extrair diretamente de 'text' no candidato (SDKs mais antigos/simples)
+                        if not text:
+                             text = getattr(candidate, "text", None)
                     if text and isinstance(text, str) and text.strip():
                         logger.info(f"✅ Gemini OK (tentativa {attempt})")
                         return self._limpar_resposta(text)
+                    else:
+                        logger.warning(f"⚠️ Gemini sem texto legível ou bloqueado (tentativa {attempt})")
                 except Exception as e:
                     logger.warning(f"Gemini erro {attempt}: {e}")
                     if "429" in str(e) or "quota" in str(e):
+                        # Exponential backoff para quotas
                         time.sleep(2 ** (attempt % 3))
+            # Se nenhum modelo respondeu, espera um pouco antes da próxima tentativa
+            time.sleep(0.5)
         logger.error("❌ Todos os provedores falharam. Retornando fallback.")
         return getattr(self.config, "FALLBACK_RESPONSE", "Desculpa, puto, não consegui responder.")
 # ================================
 # CLASSE PRINCIPAL AKIRA API
 # ================================
 class AkiraAPI:
     """Flask wrapper exposing the Akira chat, training and web-search endpoints.

     The constructor wires together the database, the LLM provider manager,
     the trainer and the web search helper, then registers every route on a
     blueprint mounted under ``/api``.
     """

     def __init__(self, cfg_module):
         """Create the Flask app, instantiate the services and register routes.

         Args:
             cfg_module: Configuration object/module. ``DB_PATH`` and
                 ``START_PERIODIC_TRAINER`` are read here with defaults;
                 ``SYSTEM_PROMPT`` and ``PERSONA`` are read when building
                 prompts.
         """
         self.config = cfg_module
         self.app = Flask(__name__)
         self.api = Blueprint("akira_api", __name__)

         # Service initialisation.
         self.db = Database(getattr(self.config, 'DB_PATH', '/app/data/akira.db'))
         # One Contexto per conversation key. NOTE(review): entries are never
         # evicted, so this grows with the number of distinct users.
         self.contexto_cache: Dict[str, Contexto] = {}
         self.providers = LLMManager(self.config)
         self.treinador = Treinamento(self.db)
         self.web_search = WebSearch()

         self._setup_routes()
         self.app.register_blueprint(self.api, url_prefix="/api")

         # Start periodic training only when the configuration asks for it.
         if getattr(self.config, 'START_PERIODIC_TRAINER', False):
             self.treinador.start_periodic_training()

     def _get_user_context(self, usuario: str, numero: str) -> Contexto:
         """Return the cached context for this user, creating it on first use.

         The cache key is ``numero`` when it is non-empty, otherwise ``usuario``.
         """
         key = numero or usuario
         if key not in self.contexto_cache:
             ctx = Contexto(self.db, key)
             ctx.atualizar_aprendizados_do_banco()
             self.contexto_cache[key] = ctx
         return self.contexto_cache[key]

     def _get_pronomes_por_tom(self, tom: str) -> str:
         """Look up the forms of address stored for a conversational tone.

         Returns:
             The first ``pronomes`` value found for the lower-cased tone, or
             ``"tu/você"`` when there is no row or the lookup fails.
         """
         try:
             result = self.db._execute_with_retry(
                 "SELECT pronomes FROM pronomes_por_tom WHERE tom=?", (tom.lower(),)
             )
             return result[0][0] if result else "tu/você"
         except Exception as e:
             # Best effort: the default is still returned, but the failure is
             # logged instead of being swallowed silently.
             logger.warning(f"⚠️ Falha ao buscar pronomes para o tom '{tom}': {e}")
             return "tu/você"

     def _build_prompt(self, usuario: str, numero: str, mensagem: str, emocao: str, contexto: Contexto, is_privileged: bool, is_reply: bool, mensagem_original: str) -> str:
         """Assemble the final prompt from rules, persona, history and message.

         Args:
             usuario: Display name of the sender.
             numero: Sender's number, shown next to the name.
             mensagem: The message to answer.
             emocao: Emotion label computed for ``mensagem``.
             contexto: Conversation context supplying tone and history.
             is_privileged: Accepted for interface compatibility; the prompt
                 does not currently depend on it.
             is_reply: Whether the message quotes an earlier one.
             mensagem_original: The quoted text, included only when
                 ``is_reply`` is true and the text is non-empty.

         Returns:
             The prompt string sent to the LLM providers.
         """
         data_hora = datetime.datetime.now().strftime("%d/%m/%Y %H:%M")
         tom_usuario = contexto.ton_predominante or "neutro"
         # The per-tone pronoun lookup that used to run here was removed: its
         # result was never inserted into the prompt, so it only cost a
         # database query on every request.

         regras = (
             "\nREGRAS:\n"
             "- Fale como pessoa real de Luanda, Angola.\n"
             "- Mantenha a resposta entre 1 a 2 frases curtas.\n"
             "- Use gírias angolanas (bué, fixe, oroh, kota, puto) quando for natural.\n"
             "- Use sarcasmo leve e risadas (kkk, rsrs) se apropriado à emoção.\n"
             "- Não use Markdown (negrito, itálico, listas).\n"
             f"- Data e Hora Atual: {data_hora}\n"
         )

         # Only the three most recent exchanges are included.
         # NOTE(review): entries are indexed by 'mensagem'/'resposta' keys;
         # confirm this matches what Contexto.obter_historico returns.
         hist = contexto.obter_historico()[-3:]
         hist_txt = "\n".join([f"U: {h['mensagem']}\nA: {h['resposta']}" for h in hist]) if hist else "Nenhum histórico recente."
         user_info = f"Usuário: {usuario} ({numero})\nTom Predominante: {tom_usuario}\nEmoção da Mensagem Atual: {emocao}\n"

         if is_reply and mensagem_original:
             reply_info = f"O usuário está respondendo a esta mensagem (citação):\n[CITAÇÃO]: {mensagem_original}\n"
         else:
             reply_info = ""

         # The prompt is laid out as tagged sections followed by the cue.
         prompt = f"[SYSTEM]\n{regras}\n{self.config.SYSTEM_PROMPT}\n{self.config.PERSONA}\n[/SYSTEM]\n"
         prompt += f"[CONTEXTO DA CONVERSA]\n{hist_txt}\n{user_info}{reply_info}[/CONTEXTO DA CONVERSA]\n\n"
         prompt += f"[MENSAGEM DO USUÁRIO]\n{mensagem}\n[/MENSAGEM DO USUÁRIO]\n\nAkira, responda a mensagem (sem usar Markdown):"
         return prompt

     # ================================
     # API routes
     # ================================
     def _setup_routes(self):
         """Register the chat, training and search endpoints on the blueprint."""

         @self.api.route('/akira', methods=['POST'])
         @self.api.route('/', methods=['POST'])
         def akira_endpoint():
             """Answer a chat message; responds 400 when 'mensagem' is missing."""
             try:
                 raw_data = request.get_data(as_text=True)
                 logger.info(f"📩 RAW recebido ({len(raw_data)} bytes)")

                 # Parse the body as JSON regardless of the Content-Type header.
                 try:
                     data = request.get_json(force=True)
                 except Exception as e:
                     logger.warning(f"⚠️ Erro ao obter JSON: {e}. Tentando fallback de parsing.")
                     try:
                         data = json.loads(raw_data)
                     except Exception:
                         data = {}
                 if not isinstance(data, dict):
                     data = {}

                 # JSON values can be numbers or null, so normalise both
                 # identifiers to strings before calling string methods.
                 usuario = data.get('usuario', 'Anônimo')
                 if usuario is None:
                     usuario = 'Anônimo'
                 elif not isinstance(usuario, str):
                     usuario = str(usuario)
                 # str(None) would yield the literal "None", which is truthy
                 # and would become a context key shared by unrelated users.
                 numero_bruto = data.get('numero')
                 numero = '' if numero_bruto is None else str(numero_bruto)

                 mensagem = data.get('mensagem', '')
                 if not isinstance(mensagem, str) or not mensagem.strip():
                     return jsonify({'error': 'mensagem obrigatória'}), 400

                 # Privilege and reply flags.
                 is_privileged = (usuario.lower() == 'isaac' or '244937035662' in numero)
                 is_reply = bool(data.get('is_reply') or data.get('mensagem_original'))
                 mensagem_original = data.get('mensagem_original') or data.get('quoted_message') or ''

                 # Context and emotion.
                 contexto = self._get_user_context(usuario, numero)
                 emocao = contexto.analisar_emocoes_mensagem(mensagem)

                 # Prompt and answer.
                 prompt = self._build_prompt(usuario, numero, mensagem, emocao, contexto, is_privileged, is_reply, mensagem_original)
                 resposta = self.providers.generate(prompt, max_tokens=500, temperature=0.8)

                 # Record the exchange in the context and the trainer.
                 contexto.atualizar_contexto(mensagem, resposta)
                 self.treinador.registrar_interacao(usuario, mensagem, resposta, numero, is_reply, mensagem_original)

                 return jsonify({
                     'resposta': resposta,
                     'emocao': emocao,
                     'usuario': usuario,
                     'numero': numero
                 })
             except Exception as e:
                 # logger.exception attaches the traceback. Passing
                 # exc_info=True to loguru is treated as a str.format()
                 # argument, which logs no traceback and can itself raise
                 # when the exception text contains braces.
                 logger.exception(f"❌ Erro fatal no endpoint: {e}")
                 return jsonify({'resposta': 'deu um erro interno, puto 😅'}), 500

         @self.api.route("/treinar", methods=["POST"])
         def treinar():
             """Feed new text to the trainer; responds 400 when 'texto' is missing."""
             # silent=True returns None for an unparsable body instead of
             # raising, so invalid or non-object JSON falls through to the
             # JSON-formatted 400 below.
             data = request.get_json(force=True, silent=True)
             if not isinstance(data, dict):
                 data = {}
             texto = data.get("texto")
             # 'numero' identifies the training scope; defaults to 'global'.
             numero = data.get("numero", "global")
             if not texto:
                 return jsonify({"erro": "Texto ausente."}), 400
             try:
                 self.treinador.treinar_texto(numero, texto)
                 return jsonify({"status": "Treinado com sucesso!"})
             except Exception as e:
                 logger.error(f"Erro no treino: {e}")
                 return jsonify({"erro": str(e)}), 500

         @self.api.route("/buscar", methods=["GET"])
         def buscar():
             """Run a web search for the 'q' query parameter."""
             query = request.args.get("q")
             if not query:
                 return jsonify({"erro": "Consulta ausente."}), 400
             try:
                 resultados = self.web_search.buscar(query)
                 return jsonify({"resultados": resultados})
             except Exception as e:
                 logger.error(f"Erro na busca: {e}")
                 return jsonify({"erro": str(e)}), 500

     def run(self, host='0.0.0.0', port=7860, debug=False):
         """Start the Flask development server (threaded)."""
         logger.info(f"🚀 Iniciando servidor Flask na porta {port}")
         self.app.run(host=host, port=port, debug=debug, threaded=True)