Spaces:

tecuhtli
/

Mori_Bot

Running

App Files Files Community

tecuhtli committed 12 days ago

Commit

9c8e3d6

1 Parent(s): 6ff6e86

Actualizando la version para entrega de Mori

Browse files

Files changed (2) hide show

Mori_TechnicalPrompts.py +157 -2
requirements.txt +4 -1

Mori_TechnicalPrompts.py CHANGED Viewed

@@ -7,7 +7,7 @@ import unicodedata
 import re
 from Mori_Chatbot_SpanishCorrections import polish_spanish
 from Mori_Technical_RAGwithFAISS import retrieve_docs
-import os
 import warnings
 # ************************************************************************
 # Defining default paths for the model to work
@@ -15,11 +15,36 @@ import warnings
 os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
 warnings.filterwarnings("ignore", category=UserWarning)
 warnings.filterwarnings("ignore", category=FutureWarning)
 #=====================================================================================
 # Functions  =========================================================================
 #=====================================================================================
 def normalize_text(text: str) -> str:
@@ -196,6 +221,136 @@ def answer_with_mori_plain(tokenizer, model, question: str, modo: str = "exacto"
     return polish_spanish(raw_answer), prompt
 def get_gen_kwargs(modo="exacto"):
     """Selecting the Mori personaliuty by using different hyperparameters settigns"""

 import re
 from Mori_Chatbot_SpanishCorrections import polish_spanish
 from Mori_Technical_RAGwithFAISS import retrieve_docs
+import os, torch
 import warnings
 # ************************************************************************
 # Defining default paths for the model to work
 os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
 warnings.filterwarnings("ignore", category=UserWarning)
 warnings.filterwarnings("ignore", category=FutureWarning)
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 #=====================================================================================
 # Functions  =========================================================================
 #=====================================================================================
def recortar_ultima_oracion(texto, min_ratio=0.3):
    """Trim a trailing unfinished sentence from generated text.

    The text is cut right after the last sentence terminator (``.``, ``?``,
    ``!`` or ``…``), so a generation that was stopped mid-sentence does not
    end with a dangling fragment.

    Args:
        texto: Generated text. ``None`` is treated as an empty string.
        min_ratio: Minimum relative position (0-1) the last terminator must
            have for the cut to happen. If the terminator sits earlier than
            ``len(texto) * min_ratio`` the text is returned untrimmed, so a
            short first sentence does not discard most of the answer.

    Returns:
        The stripped text, cut after its last complete sentence when one is
        found far enough into the text; otherwise the stripped text as is.
    """
    texto = (texto or "").strip()
    if not texto:
        return texto

    # Valid sentence-closing marks.
    signos = ".?!…"
    # Characters that may legitimately follow a terminator and still belong
    # to the same sentence (closing quotes / brackets).
    cierres = "\"'”’»)]"

    # Scan backwards for the last real terminator.
    final = -1
    ultimo = len(texto) - 1
    for i in range(ultimo, -1, -1):
        ch = texto[i]
        if ch not in signos:
            continue
        # A period between two digits is a decimal point / version number
        # ("3.14"), not the end of a sentence.
        es_decimal = (
            ch == "."
            and 0 < i < ultimo
            and texto[i - 1].isdigit()
            and texto[i + 1].isdigit()
        )
        if not es_decimal:
            final = i
            break

    if final == -1:
        return texto  # no terminator found: return the text unchanged

    # Make sure the cut does not happen too early in the text.
    if final < len(texto) * min_ratio:
        return texto

    # Keep closing quotes/brackets glued to the terminator, e.g. `"hola."`.
    fin = final + 1
    while fin < len(texto) and texto[fin] in cierres:
        fin += 1
    return texto[:fin].strip()
 def normalize_text(text: str) -> str:
     return polish_spanish(raw_answer), prompt
def build_qwen_system_prompt(persona: str) -> str:
    """Return the Spanish system prompt for the requested persona.

    The persona is matched case-insensitively by substring: a value
    containing "exacto" selects the short, precise style; otherwise a value
    containing "creativo" selects the creative style; anything else
    (including ``None`` or an empty string) gets the neutral style.

    Args:
        persona: Persona / mode label coming from the caller.

    Returns:
        The shared introduction followed by the style instructions.
    """
    intro = (
        "Eres Mori Técnico, un asistente de ciencia de datos. "
        "Respondes siempre en español de México, con explicaciones claras y amables. "
    )
    # Checked in order; the first keyword found in the persona wins.
    style_by_keyword = (
        (
            "exacto",
            "Respondes de forma muy breve, directa y precisa, "
            "en un solo párrafo de máximo 64 palabras, sin listas ni numeración.",
        ),
        (
            "creativo",
            "Respondes de forma creativa y entusiasta, con un tono cálido y motivador, "
            "en un solo párrafo de máximo 92 palabras, evitando listas y numeración.",
        ),
    )
    neutral_style = (
        "Respondes de forma breve, clara y natural, "
        "en un solo párrafo y evitando listas y numeración."
    )

    key = persona.lower() if persona else ""
    for keyword, style in style_by_keyword:
        if keyword in key:
            return intro + style
    return intro + neutral_style
def answer_with_qwen_base(
    tokenizer,
    model,
    user_question: str,
    persona: str = "Mori Técnico",
    max_new_tokens: int = 64,
) -> tuple[str, str]:
    """Generate an answer with the base Qwen model (no RAG, no fine-tuning).

    The system prompt and the sampling settings are chosen from ``persona``
    using the same case-insensitive substring match as
    ``build_qwen_system_prompt``.

    Args:
        tokenizer: Tokenizer of the model. If it exposes
            ``apply_chat_template`` the prompt is built with it; otherwise a
            plain "system/user/assistant" text prompt is used.
        model: Causal language model exposing ``generate``.
        user_question: The user's question. Empty, blank or ``None`` input
            short-circuits with a canned message.
        persona: Persona / mode label. Values containing "exacto" or
            "creativo" select their fixed presets; anything else (including
            the default) uses the "exacto" sampling values.
        max_new_tokens: Generation length for personas without a preset.
            NOTE(review): the "exacto" (64) and "creativo" (256) presets keep
            their original hard-coded lengths and do not read this value —
            confirm whether the UI value should override them.

    Returns:
        A ``(answer, prompt)`` tuple. ``prompt`` is the text sent to the
        model, or an empty string when the question was empty and no prompt
        was built.
    """
    question = (user_question or "").strip()
    if not question:
        # Same tuple shape as the normal path so callers can always unpack.
        return "Necesito que me cuentes algo para poder ayudarte 🙂.", ""

    system_prompt = build_qwen_system_prompt(persona)

    # 1) Build the text prompt (a string, not tensors).
    if hasattr(tokenizer, "apply_chat_template"):
        messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": question},
        ]
        prompt = tokenizer.apply_chat_template(
            messages,
            tokenize=False,
            add_generation_prompt=True,
        )
    else:
        prompt = (
            f"system {system_prompt}\n"
            f"user {question}\n"
            f"assistant "
        )

    # 2) Tokenize the prompt and move it to the module-level device.
    inputs = tokenizer(prompt, return_tensors="pt").to(device)

    # 3) Pick the sampling settings. Every persona gets a preset, so
    #    generation always runs (previously any persona other than exactly
    #    'exacto' / 'creativo' left the output undefined).
    mode = (persona or "").lower()
    if "exacto" in mode:
        sampling = {"max_new_tokens": 64, "temperature": 0.2, "top_p": 0.8}
    elif "creativo" in mode:
        sampling = {"max_new_tokens": 256, "temperature": 0.9, "top_p": 0.9}
    else:
        sampling = {
            "max_new_tokens": max_new_tokens,
            "temperature": 0.2,
            "top_p": 0.8,
        }

    with torch.no_grad():
        output_ids = model.generate(
            **inputs,
            do_sample=True,
            num_beams=1,
            pad_token_id=tokenizer.eos_token_id,
            **sampling,
        )

    # 4) Drop the prompt from the output. A causal LM returns the prompt
    #    tokens followed by the new ones, so slicing by the prompt length is
    #    more reliable than matching the decoded text (special tokens are
    #    stripped on decode, so the decoded text need not start with `prompt`).
    prompt_len = inputs["input_ids"].shape[-1]
    text = tokenizer.decode(output_ids[0][prompt_len:], skip_special_tokens=True)

    cleaned = recortar_ultima_oracion(text.strip())
    return cleaned.strip(), prompt
 def get_gen_kwargs(modo="exacto"):
     """Selecting the Mori personaliuty by using different hyperparameters settigns"""

requirements.txt CHANGED Viewed

@@ -9,4 +9,7 @@ torch==2.6.0
 joblib
 sentence-transformers
 faiss-cpu
-ujson

 joblib
 sentence-transformers
 faiss-cpu
+ujson
+accelerate
+numpy
+protobuf