Spaces:

ProfRod100
/

Teste_Modelo_Amazon

Runtime error

App Files Community

ProfRod100 committed on Nov 12, 2025

Commit

81ba821

verified ·

1 Parent(s): 8578fe8

Update app.py

Browse files

Files changed (1) hide show

app.py +109 -232

app.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import os
-import numpy as np
 import gradio as gr
 import joblib
 from sklearn.pipeline import Pipeline
 from sklearn.feature_extraction.text import TfidfVectorizer
@@ -10,284 +10,161 @@ from sklearn.linear_model import LogisticRegression
 from transformers import pipeline as hf_pipeline
-# ======================================================================
 # 1. Baseline de Sentimentos (TF-IDF + Logistic Regression)
-# ======================================================================
-BASELINE_PATH = os.getenv("MODEL_PATH", "baseline_pipe.pkl")
-def train_small_baseline(save_path: str = BASELINE_PATH,
-                         max_samples: int = 10000):
-    """
-    Treina um baseline pequeno usando uma amostra do dataset amazon_polarity.
-    Usado apenas se baseline_pipe.pkl nao existir no Space.
-    """
     from datasets import load_dataset
     import pandas as pd
     ds = load_dataset("amazon_polarity", split="train")
-    ds_small = ds.shuffle(seed=42).select(range(min(max_samples, len(ds))))
-    df = pd.DataFrame(
-        {"text": ds_small["content"], "label": ds_small["label"]}
-    )
-    pipe = Pipeline(
-        [
-            ("tfidf", TfidfVectorizer(max_features=30000, ngram_range=(1, 2))),
-            ("clf", LogisticRegression(max_iter=1000)),
-        ]
-    )
     pipe.fit(df["text"], df["label"])
     joblib.dump(pipe, save_path)
     return pipe
-def load_or_bootstrap_baseline():
-    """
-    Se existir baseline_pipe.pkl, carrega.
-    Se nao existir e DISABLE_AUTOTRAIN != 1, treina um baseline pequeno.
-    """
     if os.path.exists(BASELINE_PATH):
         return joblib.load(BASELINE_PATH)
-    disable_auto = os.getenv("DISABLE_AUTOTRAIN", "0")
-    if disable_auto == "1":
-        return None
     return train_small_baseline()
-baseline_model = load_or_bootstrap_baseline()
-def classify_only(text: str):
-    """
-    Apenas classifica o sentimento (positivo/negativo) e retorna JSON.
-    """
-    if not text or text.strip() == "":
-        return {"erro": "Digite um texto."}
-    if baseline_model is None:
-        return {
-            "erro": (
-                "Modelo baseline nao encontrado. "
-                "Envie baseline_pipe.pkl na aba Files ou remova DISABLE_AUTOTRAIN."
-            )
-        }
     proba = baseline_model.predict_proba([text])[0]
-    pred = int(np.argmax(proba))
-    label = "positivo" if pred == 1 else "negativo"
     conf = float(np.max(proba))
     return {"sentimento": label, "confianca": round(conf, 3)}
-# ======================================================================
-# 2. IA Generativa (LLaMA 3) para resposta ao cliente
-# ======================================================================
-# ======================================================================
-# 2. IA Generativa (FLAN-T5) para resposta ao cliente
-# ======================================================================
-GEN_MODEL_ID = os.getenv("GEN_MODEL_ID", "google/flan-t5-base")
-# text2text-generation funciona muito bem com FLAN
-generator = hf_pipeline("text2text-generation", model=GEN_MODEL_ID)
-def build_prompt(history, user_text, sentimento_json):
-    """
-    Constroi um prompt amigavel para FLAN-T5, usando historico + sentimento.
-    NENHUMA referencia a processo interno aparece na resposta.
-    """
-    sentimento = None
-    confianca = None
-    if isinstance(sentimento_json, dict):
-        sentimento = sentimento_json.get("sentimento")
-        confianca = sentimento_json.get("confianca")
-    if sentimento is None:
-        sentimento = "nao identificado"
-    # Cabeçalho de instrução (modelo vê, cliente não)
-    prompt = (
-        "Você é um atendente virtual educado, empático e profissional "
-        "de uma loja online. Responda SEMPRE em português do Brasil, "
-        "usando entre 2 e 4 frases curtas, claras e naturais.\n\n"
-        "Informação de contexto (não revele isso na resposta): "
-        f"a última mensagem do cliente foi classificada com sentimento "
-        f"'{sentimento}' (confiança {confianca}). "
-        "Use isso apenas para ajustar o tom (mais empático se negativo, "
-        "mais entusiasmado se positivo), mas não mencione a palavra "
-        "'sentimento', 'classificação' ou 'modelo'.\n\n"
-        "Histórico da conversa:\n"
     )
-    # Histórico anterior
-    if history:
-        for user, bot in history:
-            prompt += f"Cliente: {user}\n"
-            prompt += f"Atendente: {bot}\n"
-    # Nova mensagem
-    prompt += f"Cliente: {user_text}\n"
-    prompt += "Atendente:"
-    return prompt
-def generate_reply_with_history(history, user_text, sentimento_json):
-    """
-    Gera uma resposta levando em conta historico + sentimento,
-    usando FLAN-T5 em modo text2text-generation.
-    """
-    if not user_text or user_text.strip() == "":
-        return "Digite uma mensagem."
-    prompt = build_prompt(history, user_text, sentimento_json)
-    outputs = generator(
-        prompt,
-        max_length=160,
-        do_sample=True,
-        temperature=0.7,
-        top_p=0.9,
-    )
-    reply = outputs[0]["generated_text"]
-    return reply.strip()
-# ======================================================================
-# 3. Função de passo do Chatbot (para o Gradio)
-# ======================================================================
-def chatbot_step(history, user_text):
-    """
-    - Analisa sentimento da nova mensagem
-    - Gera resposta com LLaMA 3
-    - Atualiza historico
-    """
-    if not user_text or user_text.strip() == "":
-        return history, "", {}, history
-    sentiment = classify_only(user_text)
-    reply = generate_reply_with_history(history, user_text, sentiment)
-    if history is None:
-        history = []
-    history = history + [(user_text, reply)]
-    return history, "", sentiment, history
-# ======================================================================
-# 4. Interface Gradio - abas, design e historico
-# ======================================================================
-with gr.Blocks(
-    title="Chatbot de Sentimentos - Professor Rodrigo",
-    theme=gr.themes.Default().set(
-        border_radius="8px",
-        shadow_drop="small",
-        font=["Inter", "system-ui", "sans-serif"],
-    ),
-    css="""
-    #header-markdown h1 { font-size: 1.8rem; }
-    #header-markdown p { font-size: 0.95rem; }
-    """
-) as demo:
     gr.Markdown(
         """
-<div id="header-markdown">
 # Chatbot de Sentimentos (ML + IA Generativa)
-**Professor Rodrigo** — Projeto Final de Machine Learning & Deep Learning
-- Classificação: TF-IDF + Regressão Logística (baseline).
-- Geração: modelo `LLaMA 3` (Instruct) para respostas em PT-BR.
-> Dica didática: envie **`baseline_pipe.pkl`** na aba *Files* do Space
-> para usar um modelo de sentimentos treinado pelo seu grupo.
-</div>
-        """,
-        elem_id="header-markdown",
-    )
-    with gr.Tab("Análise de Sentimento (isolada)"):
-        with gr.Row():
-            with gr.Column(scale=3):
-                input_text = gr.Textbox(
-                    label="Digite uma avaliação de produto",
-                    lines=5,
-                    placeholder=(
-                        "Ex.: O produto chegou rápido e superou minhas expectativas "
-                        "ou: O produto chegou quebrado, estou muito chateado."
-                    ),
-                )
-                btn_analisar = gr.Button("Analisar sentimento", variant="primary")
-            with gr.Column(scale=2):
-                output_json = gr.JSON(
-                    label="Resultado da classificação (baseline)",
-                )
-        btn_analisar.click(classify_only, inputs=input_text, outputs=output_json)
-    with gr.Tab("Chatbot (Análise + Resposta com histórico)"):
-        with gr.Row():
-            with gr.Column(scale=3):
-                chat_history = gr.Chatbot(
-                    label="Conversa com o atendente virtual",
-                    height=400,
-                )
-                user_input = gr.Textbox(
-                    label="Mensagem do cliente",
-                    lines=4,
-                    placeholder="Ex.: Estou chateado, o produto é ruim.",
-                )
-                with gr.Row():
-                    send_btn = gr.Button("Enviar", variant="primary")
-                    clear_btn = gr.Button("Limpar conversa")
-            with gr.Column(scale=2):
-                last_sentiment = gr.JSON(
-                    label="Sentimento da última mensagem",
-                )
-                gr.Markdown(
-                    """
-**Como funciona esta aba?**
-1. O cliente envia uma mensagem.
-2. O baseline classifica o sentimento (positivo/negativo).
-3. O modelo LLaMA 3 gera uma resposta empática, usando o sentimento apenas como contexto.
-4. O histórico da conversa é mantido e influencia as respostas seguintes.
-                    """
-                )
-        state_history = gr.State([])
-        send_btn.click(
-            chatbot_step,
-            inputs=[state_history, user_input],
-            outputs=[chat_history, user_input, last_sentiment, state_history],
-        )
-        def clear_chat():
-            return [], {}, []
-        clear_btn.click(
-            clear_chat,
-            inputs=None,
-            outputs=[chat_history, last_sentiment, state_history],
-        )
-if __name__ == "__main__":
-    demo.launch()

 import os
 import gradio as gr
 import joblib
+import numpy as np
 from sklearn.pipeline import Pipeline
 from sklearn.feature_extraction.text import TfidfVectorizer
 from transformers import pipeline as hf_pipeline
+# ============================================================
 # 1. Baseline de Sentimentos (TF-IDF + Logistic Regression)
+# ============================================================
+BASELINE_PATH = "baseline_pipe.pkl"
+def train_small_baseline(save_path=BASELINE_PATH, max_samples=8000):
+    """Treina um baseline pequeno (caso o aluno não envie o .pkl)."""
     from datasets import load_dataset
     import pandas as pd
     ds = load_dataset("amazon_polarity", split="train")
+    ds_small = ds.shuffle(seed=42).select(range(max_samples))
+    df = pd.DataFrame({"text": ds_small["content"], "label": ds_small["label"]})
+    pipe = Pipeline([
+        ("tfidf", TfidfVectorizer(max_features=25000, ngram_range=(1, 2))),
+        ("clf", LogisticRegression(max_iter=1200)),
+    ])
     pipe.fit(df["text"], df["label"])
     joblib.dump(pipe, save_path)
     return pipe
+def load_baseline():
     if os.path.exists(BASELINE_PATH):
         return joblib.load(BASELINE_PATH)
     return train_small_baseline()
+baseline_model = load_baseline()
+def classify_sentiment(text):
+    if not text.strip():
+        return {"erro": "Digite algo para analisar."}
     proba = baseline_model.predict_proba([text])[0]
+    label = "positivo" if np.argmax(proba) == 1 else "negativo"
     conf = float(np.max(proba))
     return {"sentimento": label, "confianca": round(conf, 3)}
+# ============================================================
+# 2. IA Generativa — LLaMA-3-8B-Instruct
+# ============================================================
+GEN_MODEL = "meta-llama/Meta-Llama-3-8B-Instruct"
+generator = hf_pipeline(
+    "text-generation",
+    model=GEN_MODEL,
+    max_new_tokens=180,
+    temperature=0.5,
+    top_p=0.9
+)
+SYSTEM_PROMPT = """
+Você é um atendente virtual profissional, educado e empático.
+Responda sempre em português do Brasil, de forma natural
+e sem mencionar que é uma IA. Nunca justifique o processo interno.
+"""
+def build_final_prompt(history, user_msg, sentimento_json):
+    sentimento = sentimento_json.get("sentimento", "neutro")
+    if sentimento == "negativo":
+        intent = """
+O cliente está insatisfeito. Mostre empatia, peça desculpas,
+demonstre interesse em resolver e peça informações adicionais.
+"""
+    elif sentimento == "positivo":
+        intent = """
+O cliente está satisfeito. Agradeça com entusiasmo,
+reforce os pontos positivos e demonstre proximidade.
+"""
+    else:
+        intent = """
+Sentimento indefinido. Responda de forma neutra, cordial e prestativa.
+"""
+    history_text = "\n".join(
+        [f"Cliente: {msg[0]}\nAtendente: {msg[1]}" for msg in history]
     )
+    final_prompt = f"""
+{SYSTEM_PROMPT}
+Contexto da conversa:
+{history_text}
+Instruções:
+{intent}
+Mensagem do cliente:
+"{user_msg}"
+Gere uma resposta natural, com 2 a 4 frases.
+"""
+    return final_prompt
+def chat_generate(history, user_input):
+    if not user_input.strip():
+        return history, "Digite uma mensagem."
+    sentimento = classify_sentiment(user_input)
+    final_prompt = build_final_prompt(history, user_input, sentimento)
+    result = generator(final_prompt)[0]["generated_text"]
+    # Extrair somente a resposta final (remove prompt repetido)
+    if final_prompt in result:
+        result = result.split(final_prompt)[-1].strip()
+    history.append((user_input, result))
+    return history, result
+# ============================================================
+# 3. Interface Gradio (compatível com HF antigo)
+# ============================================================
+with gr.Blocks(title="Chatbot de Sentimentos - Prof. Rodrigo", theme=gr.themes.Default()) as demo:
     gr.Markdown(
         """
 # Chatbot de Sentimentos (ML + IA Generativa)
+**Professor Rodrigo — Projeto Final ML & DL**
+- Classificação de sentimento com TF-IDF + Regressão Logística
+- Respostas naturais geradas por LLaMA-3-8B-Instruct
+- Suporte a histórico de conversa
+- Envie `baseline_pipe.pkl` na aba **Files** caso tenha treinado seu próprio modelo
+        """
+    )
+    with gr.Tab("Análise de Sentimento"):
+        text_in = gr.Textbox(label="Digite um comentário", lines=4)
+        text_out = gr.JSON(label="Resultado")
+        btn_analisar = gr.Button("Analisar sentimento")
+        btn_analisar.click(classify_sentiment, inputs=text_in, outputs=text_out)
+    with gr.Tab("Chatbot (Conversação + Resposta)"):
+        chatbot = gr.Chatbot(label="Histórico de conversa")
+        user_box = gr.Textbox(label="Mensagem do cliente", lines=3)
+        send_btn = gr.Button("Enviar e gerar resposta")
+        send_btn.click(chat_generate,
+                       inputs=[chatbot, user_box],
+                       outputs=[chatbot, user_box])
+demo.launch()