Spaces:

MrMeeky
/

PixelMind

Sleeping

App Files Community

MrMeeky committed on Nov 21, 2025

Commit

ca7238b

verified ·

1 Parent(s): dd28ace

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -29

app.py CHANGED Viewed

@@ -2,34 +2,28 @@ import gradio as gr
 import joblib
 import whisper
 import re
-import nltk
-from nltk.corpus import stopwords
-# --------------------------------------------------------------------------------------------------------------------------------
 # 1. Carregar modelo de sentimento + TF-IDF
-# --------------------------------------------------------------------------------------------------------------------------------
 clf = joblib.load("sentiment_model_logreg.pkl")
 vect = joblib.load("tfidf_vect.pkl")
-# baixar stopwords no ambiente do HF
-nltk.download("stopwords", quiet=True)
-stop_words = set(stopwords.words("portuguese"))
-def clean_text(text):
     text = text.lower()
-    text = re.sub(r"[^a-zA-Zà-úÀ-ÚçÇ ]", " ", text)
-    words = [w for w in text.split() if w not in stop_words]
-    return " ".join(words)
 def predict_sentiment(text):
-    text_clean = clean_text(text)
     X = vect.transform([text_clean])
     pred = clf.predict(X)[0]
     return "POSITIVO" if pred == 1 else "NEGATIVO"
-# --------------------------------------------------------------------------------------------------------------------------------
 # 2. Carregar modelo Whisper
-# --------------------------------------------------------------------------------------------------------------------------------
 whisper_model = whisper.load_model("small")
@@ -37,37 +31,39 @@ def audio_to_text(audio_path):
     result = whisper_model.transcribe(audio_path, fp16=False)
     return result["text"]
-# --------------------------------------------------------------------------------------------------------------------------------
 # 3. Função final do pipeline
-# --------------------------------------------------------------------------------------------------------------------------------
 def pipeline(lista_audios):
     if not lista_audios:
         return []
-    resultados = []
     for audio in lista_audios:
         texto = audio_to_text(audio)
         sentimento = predict_sentiment(texto)
         resultados.append([audio, texto, sentimento])
-    return resultados
-# --------------------------------------------------------------------------------------------------------------------------------
 # 4. Interface Gradio
-# --------------------------------------------------------------------------------------------------------------------------------
 app = gr.Interface(
     fn=pipeline,
-    inputs=gr.Audio(type="filepath", label="Envie seus áudios WAV", multiple=True),
     outputs=gr.Dataframe(
-    headers=["Arquivo", "Texto reconhecido", "Sentimento"],
-    label="Resultados"),
-    ],
     title="Análise de Sentimento por Áudio",
-    description="Faça upload de um áudio WAV. O sistema transcreve o áudio e analisa o sentimento do texto."
 )
-app.launch()

 import joblib
 import whisper
 import re
+# ------------------------------
 # 1. Carregar modelo de sentimento + TF-IDF
+# ------------------------------
 clf = joblib.load("sentiment_model_logreg.pkl")
 vect = joblib.load("tfidf_vect.pkl")
+def preprocess(text):
     text = text.lower()
+    text = re.sub(r"[^a-zà-ú0-9 ]", "", text)
+    return text
 def predict_sentiment(text):
+    text_clean = preprocess(text)
     X = vect.transform([text_clean])
     pred = clf.predict(X)[0]
     return "POSITIVO" if pred == 1 else "NEGATIVO"
+# ------------------------------
 # 2. Carregar modelo Whisper
+# ------------------------------
 whisper_model = whisper.load_model("small")
     result = whisper_model.transcribe(audio_path, fp16=False)
     return result["text"]
+# ------------------------------
 # 3. Função final do pipeline
+# ------------------------------
 def pipeline(lista_audios):
     if not lista_audios:
         return []
+    resultados = []
     for audio in lista_audios:
         texto = audio_to_text(audio)
         sentimento = predict_sentiment(texto)
         resultados.append([audio, texto, sentimento])
+    return resultados
+# ------------------------------
 # 4. Interface Gradio
+# ------------------------------
 app = gr.Interface(
     fn=pipeline,
+    inputs=gr.Audio(
+        type="filepath",
+        label="Envie seus áudios WAV",
+        multiple=True
+    ),
     outputs=gr.Dataframe(
+        headers=["Arquivo", "Texto reconhecido", "Sentimento"],
+        label="Resultados"
+    ),
     title="Análise de Sentimento por Áudio",
+    description="Envie vários áudios WAV. O sistema transcreve cada um deles com Whisper e analisa o sentimento."
 )
+app.launch()