Spaces:

akra35567
/

akira

Running

App Files Community

akra35567 committed 23 days ago

Commit

11ebde4

verified ·

1 Parent(s): 7e26b2d

Upload 22 files

Browse files

Files changed (4) hide show

modules/api.py +20 -4
modules/config.py +8 -2
modules/local_llm.py +2 -1
modules/web_search.py +18 -4

modules/api.py CHANGED Viewed

@@ -202,11 +202,17 @@ class LLMManager:
         # 2. Google Gemini
         if genai:
             try:
-                # Usa nome do modelo vindo do config ou fallback
                 gemini_key = getattr(config, "GEMINI_API_KEY", None)
-                model_name = getattr(config, "GEMINI_MODEL", "gemini-1.5-flash")
                 if gemini_key:
                     if GEMINI_USING_NEW_API:
                         self.gemini_client = genai.Client(api_key=gemini_key)
                         logger.info(f"Google Gemini (Novo) ativo: {model_name}")
@@ -214,6 +220,8 @@ class LLMManager:
                         genai.configure(api_key=gemini_key)
                         self.gemini_model = genai.GenerativeModel(model_name)
                         logger.info(f"Google Gemini (Legado) ativo: {model_name}")
             except Exception as e:
                 logger.error(f"Erro ao configurar Gemini: {e}")
                 self.gemini_model = None
@@ -444,8 +452,12 @@ class LLMManager:
                 content = turn.get("content", "")
                 messages.append({"role": role, "content": content})
             messages.append({"role": "user", "content": user_prompt})
             resp = self.groq_client.chat.completions.create(
-                model='llama-3.3-70b-versatile',
                 messages=messages,
                 temperature=0.7,
                 max_tokens=1000
@@ -515,8 +527,12 @@ class LLMManager:
                 content = turn.get("content", "")
                 messages.append({"role": role, "content": content})
             messages.append({"role": "user", "content": user_prompt})
             resp = self.together_client.chat.completions.create(
-                model='meta-llama/Llama-3.3-70B-Instruct-Turbo',
                 messages=messages,
                 temperature=0.7,
                 max_tokens=1000

         # 2. Google Gemini
         if genai:
             try:
+                # Prioriza a chave do config que já limpamos
                 gemini_key = getattr(config, "GEMINI_API_KEY", None)
+                model_name = getattr(config, "GEMINI_MODEL", "gemini-2.0-flash")
                 if gemini_key:
+                    # Resolve conflito de variáveis de ambiente do SDK
+                    # O SDK do Google prioriza GOOGLE_API_KEY. Se queremos usar a GEMINI_API_KEY do config,
+                    # sobrescrevemos a GOOGLE_API_KEY do ambiente com ela para garantir consistência.
+                    if os.getenv("GOOGLE_API_KEY") != gemini_key:
+                        os.environ["GOOGLE_API_KEY"] = gemini_key
                     if GEMINI_USING_NEW_API:
                         self.gemini_client = genai.Client(api_key=gemini_key)
                         logger.info(f"Google Gemini (Novo) ativo: {model_name}")
                         genai.configure(api_key=gemini_key)
                         self.gemini_model = genai.GenerativeModel(model_name)
                         logger.info(f"Google Gemini (Legado) ativo: {model_name}")
+                else:
+                    logger.warning("Gemini não configurado: Chave ausente")
             except Exception as e:
                 logger.error(f"Erro ao configurar Gemini: {e}")
                 self.gemini_model = None
                 content = turn.get("content", "")
                 messages.append({"role": role, "content": content})
             messages.append({"role": "user", "content": user_prompt})
+            # Usar modelo do config
+            model_name = getattr(config, 'GROQ_MODEL', 'llama-3.3-70b-versatile')
             resp = self.groq_client.chat.completions.create(
+                model=model_name,
                 messages=messages,
                 temperature=0.7,
                 max_tokens=1000
                 content = turn.get("content", "")
                 messages.append({"role": role, "content": content})
             messages.append({"role": "user", "content": user_prompt})
+            # Usar modelo do config
+            model_name = getattr(config, 'TOGETHER_MODEL', 'meta-llama/Llama-3.3-70B-Instruct-Turbo')
             resp = self.together_client.chat.completions.create(
+                model=model_name,
                 messages=messages,
                 temperature=0.7,
                 max_tokens=1000

modules/config.py CHANGED Viewed

@@ -103,12 +103,18 @@ logger = setup_logger()
 def _get_key(name: str) -> str:
     val = os.getenv(name, "").strip()
     if len(val) >= 2:
         if (val.startswith('"') and val.endswith('"')) or (val.startswith("'") and val.endswith("'")):
-            return val[1:-1]
     return val
-MISTRAL_API_KEY: str = _get_key("MISTRAL_API_KEY")
 GEMINI_API_KEY: str = _get_key("GEMINI_API_KEY")
 GROQ_API_KEY: str = _get_key("GROQ_API_KEY")
 GROK_API_KEY: str = _get_key("GROK_API_KEY")
 COHERE_API_KEY: str = _get_key("COHERE_API_KEY")

 def _get_key(name: str) -> str:
     val = os.getenv(name, "").strip()
     if len(val) >= 2:
+        # Remove aspas se existirem (comum em setups de env)
         if (val.startswith('"') and val.endswith('"')) or (val.startswith("'") and val.endswith("'")):
+            val = val[1:-1]
     return val
+# Prioridade Gemini: Se GEMINI_API_KEY existir, ela manda.
+# Se não, tenta GOOGLE_API_KEY.
 GEMINI_API_KEY: str = _get_key("GEMINI_API_KEY")
+if not GEMINI_API_KEY:
+    GEMINI_API_KEY = _get_key("GOOGLE_API_KEY")
+MISTRAL_API_KEY: str = _get_key("MISTRAL_API_KEY")
 GROQ_API_KEY: str = _get_key("GROQ_API_KEY")
 GROK_API_KEY: str = _get_key("GROK_API_KEY")
 COHERE_API_KEY: str = _get_key("COHERE_API_KEY")

modules/local_llm.py CHANGED Viewed

@@ -262,7 +262,8 @@ class LocalLLMFallback:
                 model_route = self._model_path or "mistralai/Mistral-7B-Instruct-v0.3"
                 max_new = max_tokens or self._max_tokens
-                api_url = f"https://api-inference.huggingface.co/models/{model_route}/v1/chat/completions"
                 headers = {"Authorization": f"Bearer {hf_token}", "Content-Type": "application/json"}

                 model_route = self._model_path or "mistralai/Mistral-7B-Instruct-v0.3"
                 max_new = max_tokens or self._max_tokens
+                # Upgrade: Usando o novo endpoint do roteador da HF para evitar Erro 410 (Gone)
+                api_url = f"https://router.huggingface.co/hf-inference/models/{model_route}/v1/chat/completions"
                 headers = {"Authorization": f"Bearer {hf_token}", "Content-Type": "application/json"}

modules/web_search.py CHANGED Viewed

@@ -342,10 +342,24 @@ class WebSearch:
                         return True
         # 4. Contexto do histórico (se usuário estava pedindo info antes)
-        if historico:
-            ultima_5 = " ".join(historico[-5:]).lower()
-            if any(t in ultima_5 for t in ["pesquisa", "busca", "notícia", "aconteceu"]):
-                return True
         return False

                         return True
         # 4. Contexto do histórico (se usuário estava pedindo info antes)
+        if historico and isinstance(historico, list):
+            try:
+                # Conversão ultra-segura: ignora None, extrai de tupla/dict ou converte str
+                historico_limpo = []
+                for h in historico[-5:]:
+                    if h is None: continue
+                    if isinstance(h, tuple) and len(h) > 0:
+                        historico_limpo.append(str(h[0]))
+                    elif isinstance(h, dict):
+                        historico_limpo.append(str(h.get('content', h.get('mensagem', ''))))
+                    else:
+                        historico_limpo.append(str(h))
+                ultima_5 = " ".join(historico_limpo).lower()
+                if any(t in ultima_5 for t in ["pesquisa", "busca", "notícia", "aconteceu", "saber sobre"]):
+                    return True
+            except Exception as e:
+                logger.warning(f"Erro ao processar histórico na busca: {e}")
         return False