Spaces:

gnosticdev
/

interferencia-arconte

Sleeping

App Files Files Community

gnosticdev committed on Mar 9

Commit

142f56f

verified ·

1 Parent(s): 1e62b0b

Update app.py

Browse files

Files changed (1) hide show

app.py +99 -85

app.py CHANGED Viewed

@@ -4,90 +4,104 @@ import librosa
 from scipy.signal import find_peaks
 from sklearn.cluster import KMeans
-def decodificar(audio):
-    if audio is None:
-        return "No audio"
-    path = audio
-    y, sr = librosa.load(path, sr=None)
-    frame = int(sr * 0.04)
-    stft = np.abs(
-        librosa.stft(
-            y,
-            n_fft=frame*2,
-            hop_length=frame
-        )
-    )
-    freqs = librosa.fft_frequencies(sr=sr)
-    tonos = []
-    for f in stft.T:
-        if np.max(f) == 0:
-            continue
-        f = f / np.max(f)
-        peaks, _ = find_peaks(f, height=0.2)
-        if len(peaks) == 0:
-            continue
-        peak_freqs = freqs[peaks]
-        peak_freqs = peak_freqs[
-            (peak_freqs > 300) &
-            (peak_freqs < 4000)
-        ]
-        if len(peak_freqs):
-            tonos.append(peak_freqs[0])
-    if len(tonos) < 10:
-        return "Sin señal tonal clara"
-    tonos = np.array(tonos).reshape(-1,1)
-    kmeans = KMeans(n_clusters=12, n_init=10)
-    kmeans.fit(tonos)
-    centros = sorted(kmeans.cluster_centers_.flatten())
-    letras = "ABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789"
-    texto=""
-    for f in tonos.flatten():
-        cercano = min(centros, key=lambda x: abs(x-f))
-        idx = centros.index(cercano)
-        if idx < len(letras):
-            texto += letras[idx]
-    return texto
 with gr.Blocks() as demo:
-    gr.Markdown("# Decodificador de tonos estilo radio digital")
-    audio = gr.Audio(type="filepath")
-    boton = gr.Button("Decodificar")
-    salida = gr.Textbox(lines=10)
-    boton.click(
-        decodificar,
-        inputs=audio,
-        outputs=salida
-    )
-demo.launch()

 from scipy.signal import find_peaks
 from sklearn.cluster import KMeans
class DigitalToneDecoder:
    """Turn a tonal audio recording into a string of symbols.

    Pipeline: load the audio, take a magnitude STFT, keep one tone frequency
    per frame, reduce the observed frequencies to a small set of symbol
    centres, and map every tone to the character of its nearest centre.

    Args:
        frame_ms: STFT hop length in milliseconds. The FFT window is twice
            this long.
        min_freq: Exclusive lower bound (Hz) of the band searched for tones.
        max_freq: Exclusive upper bound (Hz) of the band searched for tones.
        peak_threshold: Minimum peak height, relative to the frame maximum,
            for a spectral peak to be considered.
        symbols: Maximum number of symbol centres to produce.
    """

    # Characters handed out to symbol centres, lowest frequency first.
    LETRAS = "ABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789 "

    def __init__(self, frame_ms=40, min_freq=300, max_freq=4000, peak_threshold=0.2, symbols=16):
        self.frame_ms = frame_ms
        self.min_freq = min_freq
        self.max_freq = max_freq
        self.peak_threshold = peak_threshold
        self.symbols = symbols

    def cargar_audio(self, path):
        """Load ``path`` as mono audio and remember it on the instance.

        ``sr=None`` asks librosa not to resample, so ``self.sr`` is whatever
        rate librosa reports for the file.

        Returns:
            The ``(y, sr)`` pair returned by ``librosa.load``.
        """
        y, sr = librosa.load(path, sr=None, mono=True)
        self.sr = sr
        self.y = y
        return y, sr

    def calcular_stft(self):
        """Compute the magnitude STFT of the loaded audio.

        Must be called after ``cargar_audio``.

        Returns:
            ``(stft, freqs)``: the magnitude spectrogram and the centre
            frequency in Hz of each of its rows.
        """
        hop = int(self.sr * self.frame_ms / 1000)
        n_fft = hop * 2
        stft = np.abs(librosa.stft(self.y, n_fft=n_fft, hop_length=hop, window="hann"))
        # The frequency axis must be built with the same n_fft as the STFT;
        # the library default (2048) would mislabel every bin and can be
        # shorter than the spectrogram, making freqs[peaks] fail.
        freqs = librosa.fft_frequencies(sr=self.sr, n_fft=n_fft)
        return stft, freqs

    def detectar_tonos(self, stft, freqs):
        """Pick one tone frequency per frame.

        Each frame is normalised to its own maximum; spectral peaks at or
        above ``peak_threshold`` are located, and the lowest-frequency peak
        strictly inside ``(min_freq, max_freq)`` is kept. Silent frames and
        frames with no in-band peak contribute nothing.

        Args:
            stft: Magnitude spectrogram, one column per frame.
            freqs: NumPy array with the frequency in Hz of each row of
                ``stft``.

        Returns:
            1-D NumPy array of tone frequencies in frame order.
        """
        tonos = []
        for frame in stft.T:
            level = np.max(frame)
            if level == 0:
                continue  # silent frame: nothing to normalise
            peaks, _ = find_peaks(frame / level, height=self.peak_threshold)
            candidates = freqs[peaks]
            in_band = (candidates > self.min_freq) & (candidates < self.max_freq)
            candidates = candidates[in_band]
            if candidates.size:
                # find_peaks returns ascending indices, so [0] is the lowest
                # in-band peak, not necessarily the strongest one.
                tonos.append(candidates[0])
        return np.array(tonos)

    def crear_simbolos(self, tonos):
        """Reduce the detected tones to at most ``symbols`` centre frequencies.

        When the tones already take no more than ``symbols`` distinct values,
        those values are the centres and no clustering is needed. This avoids
        duplicate centres, which would leave unused gaps in the symbol
        alphabet. Otherwise the tones are clustered with KMeans.

        Args:
            tonos: Sequence or array of tone frequencies in Hz.

        Returns:
            Ascending list of centre frequencies (floats) without duplicates
            in the non-clustered case.
        """
        values = np.asarray(tonos, dtype=float).ravel()
        distinct = np.unique(values)  # sorted and de-duplicated
        if distinct.size <= self.symbols:
            return distinct.tolist()
        # Fixed seed: decoding the same audio twice must give the same text.
        kmeans = KMeans(n_clusters=self.symbols, n_init=10, random_state=0)
        kmeans.fit(values.reshape(-1, 1))
        return sorted(kmeans.cluster_centers_.ravel().tolist())

    def decodificar(self, tonos, centros):
        """Map each tone to the character of its nearest centre.

        The centre at position ``i`` is assigned ``LETRAS[i % len(LETRAS)]``.
        Ties go to the lower-indexed centre.

        Args:
            tonos: Sequence or array of tone frequencies in Hz.
            centros: Sequence or array of centre frequencies.

        Returns:
            One character per tone, in order; ``""`` when there are no tones.

        Raises:
            ValueError: If there are tones but ``centros`` is empty.
        """
        tones = np.asarray(tonos, dtype=float).ravel()
        if tones.size == 0:
            return ""
        centres = np.asarray(centros, dtype=float).ravel()
        # Distance of every tone to every centre; argmin keeps the first
        # minimum, matching a left-to-right nearest search.
        nearest = np.abs(tones[:, None] - centres[None, :]).argmin(axis=1)
        letras = self.LETRAS
        return "".join(letras[i % len(letras)] for i in nearest)
def analizar(audio_path, progress=gr.Progress()):
    """Decode one audio file and return a Markdown-formatted report.

    Runs the DigitalToneDecoder pipeline step by step, reporting progress
    before each stage.

    Args:
        audio_path: Path of the audio file, or None when nothing was given.
        progress: Callable progress reporter taking a fraction and ``desc``.

    Returns:
        A warning string when there is no audio or no tones were found,
        otherwise the report text with the decoded sequence.
    """
    if audio_path is None:
        return "⚠️ No hay audio"

    progress(0.2, desc="Cargando audio...")
    decoder = DigitalToneDecoder()
    decoder.cargar_audio(audio_path)

    progress(0.4, desc="Calculando STFT...")
    stft, freqs = decoder.calcular_stft()

    progress(0.6, desc="Detectando tonos...")
    tonos = decoder.detectar_tonos(stft, freqs)
    if not len(tonos):
        return "💤 No se detectaron tonos en el rango útil (300-4000Hz)"

    progress(0.8, desc="Agrupando frecuencias...")
    centros = decoder.crear_simbolos(tonos)

    progress(1.0, desc="Decodificando...")
    texto = decoder.decodificar(tonos, centros)

    # Assemble the report in one pass instead of repeated concatenation.
    secciones = (
        "📊 **DATOS TÉCNICOS:**\n",
        f"- Tonos detectados: {len(tonos)}\n",
        f"- Clusters únicos: {len(centros)}\n",
        f"- Frecuencias base: {[f'{c:.1f}Hz' for c in centros]}\n\n",
        f"🔤 **SECUENCIA DECODIFICADA:**\n\n`{texto}`\n\n",
        "*Nota: Las letras se asignan por cluster de frecuencia, no por voz humana.*",
    )
    return "".join(secciones)
 with gr.Blocks() as demo:
+    gr.Markdown("""
+    # 📡 Decodificador de Tonos Digitales (DSP Real)
+    ## STFT + Detección de Picos + KMeans Clustering
+    *Basado en modos digitales de radio (PSK31, RTTY).*
+    *Decodifica frecuencias dominantes a símbolos. La interpretación es tuya.*
+    """)
+    audio = gr.Audio(label="Audio", type="filepath", sources=["upload", "microphone"])
+    btn = gr.Button("Decodificar", variant="primary")
+    output = gr.Textbox(label="Resultado", lines=12)
+    btn.click(analizar, inputs=audio, outputs=output)
+if __name__ == "__main__":
+    demo.launch()