Spaces:

agusansola
/

cora_app

Sleeping

App Files Files Community

agusansola committed on Mar 11

Commit

6d56bb7

1 Parent(s): ee282b8

Add simple audio analysis API for Flutter integration

Browse files

Files changed (3) hide show

.gitignore +8 -0
app.py +137 -0
requirements.txt +5 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,8 @@

+venv/
+.venv/
+__pycache__/
+*.pyc
+.cache/
+.local/
+.env
+.DS_Store

app.py ADDED Viewed

	@@ -0,0 +1,137 @@

+import re #serve per sostituire le parole nel testo
+import gradio as gr #serve per esporre la funzione come app/API
+from transformers import pipeline #serve per usare i modelli in modo semplice
# LOAD MODELS - the three pipelines are created once, at import time, and
# reused by every call to process_audio.
transcriber = pipeline(
    "automatic-speech-recognition",
    model="openai/whisper-base",
    # Whisper works on windows of up to 30 seconds; enabling chunking lets the
    # pipeline transcribe longer recordings window by window.
    chunk_length_s=30,
)
ner_model = pipeline(
    "ner",
    model="Davlan/xlm-roberta-base-ner-hrl",
    # Grouped results expose the "entity_group" and "word" keys that the rest
    # of this file reads.
    aggregation_strategy="simple",
)
sentiment_model = pipeline(
    "sentiment-analysis",
    model="cardiffnlp/twitter-xlm-roberta-base-sentiment",
)
# HELPERS - some models do not return "positive", "negative" or "neutral"
# directly but generic codes; this helper turns them into readable words.
_SENTIMENT_BY_CODE = {
    "LABEL_0": "negative",
    "LABEL_1": "neutral",
    "LABEL_2": "positive",
}
_SENTIMENT_NAMES = frozenset(_SENTIMENT_BY_CODE.values())


def map_sentiment_label(label):
    """Return a lowercase sentiment name for a raw classifier label.

    Args:
        label: The label reported by the sentiment model, e.g. ``"LABEL_2"``
            or ``"Positive"``.

    Returns:
        ``"negative"``, ``"neutral"`` or ``"positive"`` when ``label`` is a
        known code or a case/whitespace variant of one of those names;
        otherwise ``label`` itself, unchanged.
    """
    if not isinstance(label, str):
        return label

    cleaned = label.strip()

    # Generic codes, matched case-insensitively ("label_2" == "LABEL_2").
    mapped = _SENTIMENT_BY_CODE.get(cleaned.upper())
    if mapped is not None:
        return mapped

    # Already a readable name: only normalise its casing so the client always
    # sees the same three spellings.
    lowered = cleaned.lower()
    if lowered in _SENTIMENT_NAMES:
        return lowered

    return label
# Anonymisation helper: takes the original text and the entities found by the
# NER step, and replaces each entity with a placeholder such as [PER], [LOC]
# or [ORG].
def anonymize_text(text, entities):
    """Replace every occurrence of each entity's text with ``[<entity_group>]``.

    Matching is case-insensitive and replaces all occurrences of an entity's
    text, not only the one the NER step reported. All entities are substituted
    in a single pass, so a placeholder that has just been inserted is never
    scanned again; a short entity such as "Per" or "er" therefore cannot
    corrupt an inserted "[PER]".

    Args:
        text: The text to anonymise.
        entities: Iterable of dicts with a ``"word"`` key (the entity text)
            and an ``"entity_group"`` key (the placeholder label). Entities
            whose word is missing or empty are ignored.

    Returns:
        The anonymised text; ``text`` unchanged when there is nothing to
        replace.
    """
    # Longest entities first, so that at any position "New York" is preferred
    # over "York".
    by_length = sorted(
        entities,
        key=lambda item: len(item.get("word") or ""),
        reverse=True,
    )

    replacements = []  # (entity text, placeholder), in matching priority order
    seen = set()
    for entity in by_length:
        word = entity.get("word") or ""
        folded = word.lower()
        if not word or folded in seen:
            continue
        seen.add(folded)
        replacements.append((word, f"[{entity.get('entity_group', '')}]"))

    if not replacements:
        return text

    # One capturing group per entity: Match.lastindex then identifies which
    # entity matched without having to compare strings case-insensitively.
    pattern = re.compile(
        "|".join(f"({re.escape(word)})" for word, _ in replacements),
        flags=re.IGNORECASE,
    )
    return pattern.sub(
        lambda match: replacements[match.lastindex - 1][1],
        text,
    )
# MAIN FUNCTION - the entry point that the Flutter client reaches indirectly
# through the Space. It always answers with the same JSON structure, also when
# something goes wrong.
def _error_response(message):
    """Build a response with the standard keys, an error message and empty results."""
    return {
        "error": message,
        "transcription": "",
        "anonymized_text": "",
        "entities": [],
        "sentiment": {
            "label": "",
            "score": 0.0
        }
    }


def process_audio(audio_path):
    """Transcribe an audio file, anonymise the text and classify its sentiment.

    Args:
        audio_path: Path of the audio file to analyse, or ``None`` when no
            audio was provided.

    Returns:
        A dict with the keys ``"error"`` (empty string on success),
        ``"transcription"``, ``"anonymized_text"``, ``"entities"`` (list of
        dicts with ``"entity_group"``, ``"word"`` and ``"score"``) and
        ``"sentiment"`` (dict with ``"label"`` and ``"score"``). On failure the
        result fields are empty and ``"error"`` describes the problem.
    """
    if audio_path is None:
        return _error_response("No audio file provided")

    try:
        # Transcription - Whisper listens to the audio and produces the text.
        transcription_result = transcriber(audio_path)
        transcription = (transcription_result.get("text") or "").strip()
        if not transcription:
            return _error_response("Empty transcription")

        # NER - keep only the fields the client needs, with rounded scores.
        entities = [
            {
                "entity_group": item.get("entity_group", ""),
                "word": item.get("word", ""),
                "score": round(float(item.get("score", 0.0)), 4)
            }
            for item in ner_model(transcription)
        ]

        # Replace the detected entities with placeholders.
        anonymized_text = anonymize_text(transcription, entities)

        # Sentiment analysis runs on the anonymised text. Truncation keeps a
        # long transcript within the classifier's input limit.
        sentiment_result = sentiment_model(
            anonymized_text,
            truncation=True,
            max_length=512,
        )[0]
        sentiment = {
            "label": map_sentiment_label(sentiment_result.get("label", "")),
            "score": round(float(sentiment_result.get("score", 0.0)), 4)
        }
    except Exception as exc:
        # Boundary handler: the client expects the JSON structure above even
        # when a model fails, so log the traceback and report the failure in
        # the "error" field instead of letting the exception escape.
        import logging

        logging.getLogger(__name__).exception("Audio analysis failed")
        return _error_response(f"Processing failed: {exc}")

    # Final response.
    return {
        "error": "",
        "transcription": transcription,
        "anonymized_text": anonymized_text,
        "entities": entities,
        "sentiment": sentiment
    }
# GRADIO APP
# Input component: audio that is uploaded or recorded with the microphone,
# passed to the callback as a file path.
audio_input = gr.Audio(type="filepath", sources=["upload", "microphone"])
# Output component: the callback's result shown as JSON.
json_output = gr.JSON()

# Wire process_audio to the two components.
app = gr.Interface(
    fn=process_audio,
    inputs=audio_input,
    outputs=json_output,
    title="Audio Analysis API",
    description="Upload an audio file to get transcription, anonymization and sentiment.",
)

# Start the app.
app.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+transformers
+torch
+gradio
+accelerate
+sentencepiece