Spaces:

Leches33
/

AI

Sleeping

App Files Community

Leches33 committed on Feb 23

Commit

80288b2

verified ·

1 Parent(s): 213cafe

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -17

app.py CHANGED Viewed

@@ -8,12 +8,12 @@ import random
 import numpy as np
 # --- 1. DETERMINISMO TOTAL ---
-# Esto asegura que HF use la misma lógica matemática que tu PC
 def set_seed(seed=42):
     random.seed(seed)
     np.random.seed(seed)
     torch.manual_seed(seed)
-    torch.cuda.manual_seed_all(seed)
 set_seed(42)
@@ -42,7 +42,6 @@ class MiniGPT(nn.Module):
     def forward(self, idx, targets=None):
         B, T = idx.shape
-        # Limitamos el tamaño del bloque para evitar errores de índice
         T = min(T, block_size)
         idx = idx[:, -T:]
@@ -62,53 +61,47 @@ class MiniGPT(nn.Module):
 # --- CARGA DEL MODELO ---
 model = MiniGPT(vocab_size).to(device)
 if os.path.exists("mini_gpt.pth"):
-    # Uso de weights_only=True por seguridad y compatibilidad
-    model.load_state_dict(torch.load("mini_gpt.pth", map_location=device))
 model.eval()
 # --- FUNCIÓN DE RESPUESTA OPTIMIZADA ---
 def responder(mensaje, historial):
-    # Formateamos el prompt exactamente como en el entrenamiento
-    # Usamos marcas claras para que la IA sepa dónde empezar
     contexto = f"### Human: {mensaje}\n### Assistant: "
     tokens = [ord(c) if ord(c) < 256 else 32 for c in contexto]
     ai_txt = ""
     with torch.no_grad():
-        for _ in range(100): # 100 caracteres es suficiente para CPU
             idx = torch.tensor([tokens[-block_size:]], dtype=torch.long).to(device)
             logits, _ = model(idx)
-            # --- GREEDY SEARCH (Cero azar) ---
-            # En lugar de multinomial, usamos argmax para que PC y HF sean gemelos
             next_token = torch.argmax(logits[:, -1, :], dim=-1).item()
             char = chr(next_token)
-            # Frenado de emergencia si empieza a repetir el prompt
             if char == "\n" and len(ai_txt) > 5: break
             if "### Human:" in ai_txt: break
             tokens.append(next_token)
             ai_txt += char
-    # --- LIMPIEZA FINAL ---
-    # Eliminamos cualquier residuo de las etiquetas de entrenamiento
     output = ai_txt.split("###")[0].strip()
-    # Si la respuesta es nula o basura, damos un aviso
     if not output:
         return "Lo siento, todavía estoy aprendiendo de este dataset..."
     return output
 # --- INTERFAZ GRADIO ---
 demo = gr.ChatInterface(
     fn=responder,
     title="Mi IA Personal (Sync Edition)",
     description="Entrenando en PC -> Desplegado en HF. Sincronización de respuestas activa.",
-    examples=["Hola", "¿Qué tal?", "Cuéntame algo"],
-    theme="soft"
 )
 if __name__ == "__main__":

 import numpy as np
 # --- 1. DETERMINISMO TOTAL ---
 def set_seed(seed=42):
     random.seed(seed)
     np.random.seed(seed)
     torch.manual_seed(seed)
+    if torch.cuda.is_available():
+        torch.cuda.manual_seed_all(seed)
 set_seed(42)
     def forward(self, idx, targets=None):
         B, T = idx.shape
         T = min(T, block_size)
         idx = idx[:, -T:]
 # --- CARGA DEL MODELO ---
 model = MiniGPT(vocab_size).to(device)
 if os.path.exists("mini_gpt.pth"):
+    try:
+        model.load_state_dict(torch.load("mini_gpt.pth", map_location=device))
+    except Exception as e:
+        print(f"Error al cargar pesos: {e}")
 model.eval()
 # --- FUNCIÓN DE RESPUESTA OPTIMIZADA ---
 def responder(mensaje, historial):
     contexto = f"### Human: {mensaje}\n### Assistant: "
     tokens = [ord(c) if ord(c) < 256 else 32 for c in contexto]
     ai_txt = ""
     with torch.no_grad():
+        for _ in range(100):
             idx = torch.tensor([tokens[-block_size:]], dtype=torch.long).to(device)
             logits, _ = model(idx)
+            # Greedy Search (Determinista)
             next_token = torch.argmax(logits[:, -1, :], dim=-1).item()
             char = chr(next_token)
             if char == "\n" and len(ai_txt) > 5: break
             if "### Human:" in ai_txt: break
             tokens.append(next_token)
             ai_txt += char
     output = ai_txt.split("###")[0].strip()
     if not output:
         return "Lo siento, todavía estoy aprendiendo de este dataset..."
     return output
 # --- INTERFAZ GRADIO ---
+# Eliminado el argumento 'theme' para evitar el TypeError en el servidor de HF
 demo = gr.ChatInterface(
     fn=responder,
     title="Mi IA Personal (Sync Edition)",
     description="Entrenando en PC -> Desplegado en HF. Sincronización de respuestas activa.",
+    examples=["Hola", "¿Qué tal?", "Cuéntame algo"]
 )
 if __name__ == "__main__":