Spaces:

TeszenAI
/

MTP-3space

Sleeping

App Files Files Community

teszenofficial committed on Apr 8

Commit

8cd8259

verified ·

1 Parent(s): 470d2fa

Upload app.py

Browse files

Files changed (1) hide show

app.py +120 -19

app.py CHANGED Viewed

@@ -4,6 +4,7 @@ import torch
 import json
 import time
 import gc
 from fastapi import FastAPI, Request
 from fastapi.responses import HTMLResponse, StreamingResponse
 from fastapi.middleware.cors import CORSMiddleware
@@ -33,6 +34,97 @@ torch.set_grad_enabled(False)
 # CAMBIA ESTO POR EL NOMBRE DE TU REPO EN HUGGING FACE
 MODEL_REPO = "TeszenAI/MTP-3"  # <-- CAMBIA A TU REPO
 # ======================
 # DEFINIR ARQUITECTURA DEL MODELO (MTP)
 # ======================
@@ -144,11 +236,14 @@ class MTPModel(nn.Module):
         logits = self.lm_head(x)
         return logits
-    def generate(self, input_ids, max_new_tokens=100, temperature=0.8, top_k=50, top_p=0.9, repetition_penalty=1.1):
-        """Método de generación compatible con la interfaz"""
         generated = input_ids
-        for _ in range(max_new_tokens):
             with torch.no_grad():
                 logits = self(generated)
                 next_logits = logits[0, -1, :] / temperature
@@ -177,6 +272,13 @@ class MTPModel(nn.Module):
                 break
             generated = torch.cat([generated, torch.tensor([[next_token]], device=generated.device)], dim=1)
         return generated
@@ -350,6 +452,9 @@ async def generate(req: PromptRequest):
         if "###" in response:
             response = response.split("###")[0].strip()
         return {
             "reply": response,
@@ -394,7 +499,7 @@ def model_info():
     }
 # ======================
-# INTERFAZ WEB (MODERNA)
 # ======================
 @app.get("/", response_class=HTMLResponse)
 def chat_ui():
@@ -451,12 +556,11 @@ header {
     width: 32px;
     height: 32px;
     border-radius: 50%;
-    background: linear-gradient(135deg, #4a9eff, #7c3aed);
-    display: flex;
-    align-items: center;
-    justify-content: center;
-    font-weight: bold;
-    font-size: 14px;
 }
 .brand-text {
     font-weight: 500;
@@ -523,12 +627,10 @@ header {
     height: 34px;
     min-width: 34px;
     border-radius: 50%;
-    background: linear-gradient(135deg, #4a9eff, #7c3aed);
-    display: flex;
-    align-items: center;
-    justify-content: center;
-    font-weight: bold;
-    font-size: 14px;
     box-shadow: 0 2px 6px rgba(0,0,0,0.2);
 }
 .bot-actions {
@@ -630,7 +732,7 @@ header {
 <body>
 <header>
     <div class="brand-wrapper" onclick="location.reload()">
-        <div class="brand-logo">MTP</div>
         <div class="brand-text">
             MTP <span class="version-badge">v1</span>
         </div>
@@ -638,7 +740,7 @@ header {
 </header>
 <div id="chatScroll" class="chat-scroll">
     <div class="msg-row bot" style="animation-delay: 0.1s;">
-        <div class="bot-avatar">M</div>
         <div class="msg-content-wrapper">
             <div class="msg-text">
                 ¡Hola! Soy MTP, tu asistente de IA. ¿En qué puedo ayudarte hoy?
@@ -712,7 +814,6 @@ async function sendMessage(textOverride = null) {
     botRow.className = 'msg-row bot';
     const avatar = document.createElement('div');
     avatar.className = 'bot-avatar pulsing';
-    avatar.textContent = 'M';
     const wrapper = document.createElement('div');
     wrapper.className = 'msg-content-wrapper';
     const msgText = document.createElement('div');

 import json
 import time
 import gc
+import re
 from fastapi import FastAPI, Request
 from fastapi.responses import HTMLResponse, StreamingResponse
 from fastapi.middleware.cors import CORSMiddleware
 # CAMBIA ESTO POR EL NOMBRE DE TU REPO EN HUGGING FACE
 MODEL_REPO = "TeszenAI/MTP-3"  # <-- CAMBIA A TU REPO
+# ======================
+# FUNCIONES DE LIMPIEZA Y CONTROL DE CALIDAD
+# ======================
# Runs of five or more identical non-digit characters ("aaaaaaa", "!!!!!!").
# Digits are excluded on purpose so numbers such as 1000000 are not mangled.
_CHAR_RUN_RE = re.compile(r'(\D)\1{4,}')
# Anything that is not a Spanish letter, digit, whitespace or basic punctuation.
_DISALLOWED_CHARS_RE = re.compile(r'[^a-zA-ZáéíóúñüÁÉÍÓÚÑÜ0-9\s.,;:!?¿¡()\-"]+')
# Closing questions after which the reply is considered finished.
_CLOSING_QUESTION_RE = re.compile(
    r'(¿algo más\?|¿necesitas algo más\?|¿en qué más puedo ayudarte\?)',
    re.IGNORECASE,
)
# A word may appear this many extra times in a row before copies are dropped.
_MAX_CONSECUTIVE_REPEATS = 2
# Replies shorter than this (after cleaning) are replaced by the fallback.
_MIN_REPLY_CHARS = 10
_FALLBACK_REPLY = "Lo siento, no pude generar una respuesta clara. ¿Podrías reformular tu pregunta?"


def clean_response(text: str) -> str:
    """Clean a generated reply before it is returned to the user.

    Steps, in order:
      1. Drop a word once it has already appeared three times in a row.
      2. Collapse runs of 5+ identical non-digit characters to two, then
         remove every character outside the allowed Spanish alphabet,
         digits, whitespace and basic punctuation.
      3. Truncate right after the first closing question
         ("¿algo más?", "¿necesitas algo más?", "¿en qué más puedo ayudarte?").
      4. Return a fixed fallback message if fewer than 10 characters remain.
      5. Collapse all whitespace to single spaces.

    Args:
        text: Raw decoded model output.

    Returns:
        The cleaned reply, ``""`` when ``text`` is empty, or the fallback
        message when the cleaned reply is too short.
    """
    if not text:
        return ""

    # 1. Limit consecutive repetitions of the same word.
    kept_words = []
    previous_word = None
    repeats = 0
    for word in text.split():
        if word == previous_word:
            repeats += 1
            if repeats > _MAX_CONSECUTIVE_REPEATS:
                continue
        else:
            previous_word = word
            repeats = 0
        kept_words.append(word)
    text = " ".join(kept_words)

    # 2. Remove nonsense patterns (stretched letters, unsupported symbols).
    text = _CHAR_RUN_RE.sub(r'\1\1', text)
    text = _DISALLOWED_CHARS_RE.sub('', text)

    # 3. Cut after the first closing question. The earlier version also
    #    tried "$"-anchored patterns first; those can only match at the very
    #    end of the text, so cutting there changed nothing, and the `break`
    #    that followed kept this pattern from ever being checked.
    closing = _CLOSING_QUESTION_RE.search(text)
    if closing:
        text = text[:closing.end()]

    # 4. Too little left to be a useful answer.
    if len(text.strip()) < _MIN_REPLY_CHARS:
        return _FALLBACK_REPLY

    # 5. Stripping symbols in step 2 can leave double spaces behind.
    return re.sub(r'\s+', ' ', text).strip()
# Phrases that signal the reply has reached its natural end.
_STOP_SIGNAL_PATTERNS = tuple(
    re.compile(pattern, re.IGNORECASE)
    for pattern in (
        r'(gracias por tu pregunta|espero haberte ayudado|¿necesitas algo más\?)',
        r'(hasta luego|adiós|quedo atento|saludos cordiales)',
        r'(fin del mensaje|fin de la conversación)',
    )
)
_SENTENCE_END_RE = re.compile(r'[.!?]$')
# Split point between sentences: whitespace that follows a terminator.
_SENTENCE_BOUNDARY_RE = re.compile(r'(?<=[.!?])\s+')
# A final sentence must be longer than this to count as "complete".
_MIN_LAST_SENTENCE_CHARS = 5


def should_stop_generation(generated_text: str, min_length: int = 30, max_length: int = 300) -> bool:
    """Decide whether generation should stop, based on the text so far.

    Args:
        generated_text: Text generated so far.
        min_length: Below this many characters, text without final
            punctuation never stops; the "complete sentence" rule also
            requires more than this many characters.
        max_length: Above this many characters generation always stops.

    Returns:
        True when the text exceeds ``max_length``, contains a closing phrase,
        or is longer than ``min_length`` and ends with a complete sentence;
        False otherwise.
    """
    # Hard cap on length.
    if len(generated_text) > max_length:
        return True

    # Too short and not even ending a sentence: keep going.
    if len(generated_text) < min_length and not _SENTENCE_END_RE.search(generated_text):
        return False

    # Explicit closing phrases.
    if any(signal.search(generated_text) for signal in _STOP_SIGNAL_PATTERNS):
        return True

    # Complete final sentence. The sentence is taken together with its
    # terminator; splitting on '.' (as before) stripped the period, so a
    # reply ending in "." could never be recognised as finished.
    last_sentence = _SENTENCE_BOUNDARY_RE.split(generated_text.strip())[-1]
    ends_cleanly = bool(_SENTENCE_END_RE.search(last_sentence))
    return (
        ends_cleanly
        and len(last_sentence) > _MIN_LAST_SENTENCE_CHARS
        and len(generated_text) > min_length
    )
 # ======================
 # DEFINIR ARQUITECTURA DEL MODELO (MTP)
 # ======================
         logits = self.lm_head(x)
         return logits
+    def generate(self, input_ids, max_new_tokens=150, temperature=0.8, top_k=50, top_p=0.9, repetition_penalty=1.1):
+        """Método de generación mejorado con detección inteligente de fin"""
         generated = input_ids
+        generated_text = ""
+        min_response_length = 30
+        max_response_length = max_new_tokens * 2
+        for step in range(max_new_tokens):
             with torch.no_grad():
                 logits = self(generated)
                 next_logits = logits[0, -1, :] / temperature
                 break
             generated = torch.cat([generated, torch.tensor([[next_token]], device=generated.device)], dim=1)
+            # Decodificar parcialmente para verificar si debemos parar (solo cada 10 pasos para eficiencia)
+            if step > 10 and step % 10 == 0:
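+                # NOTE(review): nothing is decoded here; the real tokenizer lives outside this class.
+                # str(generated[0].tolist()) is the printed list of token IDs (prompt included), so the
+                # phrase/punctuation checks in should_stop_generation cannot match and only its
+                # max_length test (on the length of that ID string) can fire. Decode before calling it.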
+                if len(generated[0]) > 10:
+                    if should_stop_generation(str(generated[0].tolist()), min_response_length, max_response_length):
+                        break
         return generated
         if "###" in response:
             response = response.split("###")[0].strip()
+        # Aplicar limpieza inteligente a la respuesta
+        response = clean_response(response)
         return {
             "reply": response,
     }
 # ======================
+# INTERFAZ WEB (MODERNA CON LOGO INTEGRADO)
 # ======================
 @app.get("/", response_class=HTMLResponse)
 def chat_ui():
     width: 32px;
     height: 32px;
     border-radius: 50%;
+    background-image: url('https://i.postimg.cc/c4BRhSnR/8F838209-6DD9-4E1C-96BB-621EC3B78E68.png');
+    background-size: cover;
+    background-position: center;
+    background-repeat: no-repeat;
+    border: 1px solid rgba(255,255,255,0.1);
 }
 .brand-text {
     font-weight: 500;
     height: 34px;
     min-width: 34px;
     border-radius: 50%;
+    background-image: url('https://i.postimg.cc/c4BRhSnR/8F838209-6DD9-4E1C-96BB-621EC3B78E68.png');
+    background-size: cover;
+    background-position: center;
+    background-repeat: no-repeat;
     box-shadow: 0 2px 6px rgba(0,0,0,0.2);
 }
 .bot-actions {
 <body>
 <header>
     <div class="brand-wrapper" onclick="location.reload()">
+        <div class="brand-logo"></div>
         <div class="brand-text">
             MTP <span class="version-badge">v1</span>
         </div>
 </header>
 <div id="chatScroll" class="chat-scroll">
     <div class="msg-row bot" style="animation-delay: 0.1s;">
+        <div class="bot-avatar"></div>
         <div class="msg-content-wrapper">
             <div class="msg-text">
                 ¡Hola! Soy MTP, tu asistente de IA. ¿En qué puedo ayudarte hoy?
     botRow.className = 'msg-row bot';
     const avatar = document.createElement('div');
     avatar.className = 'bot-avatar pulsing';
     const wrapper = document.createElement('div');
     wrapper.className = 'msg-content-wrapper';
     const msgText = document.createElement('div');