Spaces:

caarleexx
/

PARA.AI

Runtime error

App Files Community

caarleexx committed about 1 month ago

Commit

f504c37

verified ·

1 Parent(s): e78ccf9

Update api/processors/processor_llm_base.py

Browse files

Files changed (1) hide show

api/processors/processor_llm_base.py +24 -16

api/processors/processor_llm_base.py CHANGED Viewed

@@ -1,8 +1,8 @@
 """
-Processor Base com integração LLM REAL
-Substitui processamento MOCK por chamadas ao Groq
 """
-from typing import Dict, Any, Optional, List
 from datetime import datetime
 import logging
 from abc import ABC, abstractmethod
@@ -12,7 +12,7 @@ logger = logging.getLogger(__name__)
 class ProcessorLLMBase(ABC):
     """
-    Processor base que integra com LLM real (Groq).
     Substitui hardcoded por prompts e chamadas reais.
     """
@@ -27,7 +27,7 @@ class ProcessorLLMBase(ABC):
         Args:
             specialist_id: ID do especialista (1-9)
             specialist_name: Nome descritivo
-            llm_client: Cliente LLM configurado (GroqClient)
         """
         self.specialist_id = specialist_id
         self.specialist_name = specialist_name
@@ -59,18 +59,20 @@ class ProcessorLLMBase(ABC):
         self,
         prompt: str,
         max_tokens: int = 2048,
-        temperature: float = 0.3
     ) -> str:
         """
-        Faz chamada ao LLM real.
         Args:
             prompt: Prompt a enviar
             max_tokens: Máximo de tokens
             temperature: Temperatura (0-1)
         Returns:
-            Resposta do LLM
         """
         if not self.llm_client:
             self.add_error("LLM client não disponível")
@@ -80,30 +82,36 @@ class ProcessorLLMBase(ABC):
             start_time = datetime.now()
             logger.info(
-                f"[{self.specialist_name}] Chamando LLM... "
                 f"(max_tokens={max_tokens}, temp={temperature})"
             )
-            # Chamada real ao LLM
             response = self.llm_client.generate(
                 prompt=prompt,
-                max_tokens=max_tokens,
-                temperature=temperature
             )
             elapsed = (datetime.now() - start_time).total_seconds()
             self.execution_time += elapsed
             logger.info(
-                f"[{self.specialist_name}] LLM respondeu em {elapsed:.2f}s "
-                f"({len(response)} chars)"
             )
-            return response
         except Exception as e:
             self.add_error(f"Erro ao chamar LLM: {e}")
-            logger.error(f"[{self.specialist_name}] Erro LLM: {e}", exc_info=True)
             return ""
     def add_error(self, error_msg: str):

 """
+Processor Base com integração LLMManager REAL
+Classe abstrata para processors que usam LLM
 """
+from typing import Dict, Any, Optional
 from datetime import datetime
 import logging
 from abc import ABC, abstractmethod
 class ProcessorLLMBase(ABC):
     """
+    Processor base que integra com LLM via client (GroqClient, etc).
     Substitui hardcoded por prompts e chamadas reais.
     """
         Args:
             specialist_id: ID do especialista (1-9)
             specialist_name: Nome descritivo
+            llm_client: Cliente LLM (GroqClient, OpenAIClient, etc)
         """
         self.specialist_id = specialist_id
         self.specialist_name = specialist_name
         self,
         prompt: str,
         max_tokens: int = 2048,
+        temperature: float = 0.3,
+        model: Optional[str] = None
     ) -> str:
         """
+        Faz chamada ao LLM real via client.
         Args:
             prompt: Prompt a enviar
             max_tokens: Máximo de tokens
             temperature: Temperatura (0-1)
+            model: Modelo específico (opcional)
         Returns:
+            Resposta do LLM (texto)
         """
         if not self.llm_client:
             self.add_error("LLM client não disponível")
             start_time = datetime.now()
             logger.info(
+                f"[{self.specialist_name}] 🤖 Chamando LLM... "
                 f"(max_tokens={max_tokens}, temp={temperature})"
             )
+            # Chamada real ao LLM via client
+            # GroqClient.generate() retorna LLMResponse com .content
             response = self.llm_client.generate(
                 prompt=prompt,
+                model=model,  # Opcional, usa default se None
+                temperature=temperature,
+                max_tokens=max_tokens
             )
+            # Extrair conteúdo da resposta
+            # LLMResponse tem atributo .content
+            content = response.content if hasattr(response, 'content') else str(response)
             elapsed = (datetime.now() - start_time).total_seconds()
             self.execution_time += elapsed
             logger.info(
+                f"[{self.specialist_name}] ✅ LLM respondeu em {elapsed:.2f}s "
+                f"({len(content)} chars)"
             )
+            return content
         except Exception as e:
             self.add_error(f"Erro ao chamar LLM: {e}")
+            logger.error(f"[{self.specialist_name}] ❌ Erro LLM: {e}", exc_info=True)
             return ""
     def add_error(self, error_msg: str):