Spaces:

not-lain
/

ggwave

Running

App Files Files Community

not-lain committed on Feb 17

Commit

cab8d03

verified ·

1 Parent(s): 9081ee2

baseline

Browse files

Files changed (4) hide show

.gitattributes +1 -0
app.py +133 -0
audio.wav +3 -0
requirements.txt +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+audio.wav filter=lfs diff=lfs merge=lfs -text

app.py ADDED Viewed

	@@ -0,0 +1,133 @@

+import ggwave
+import gradio as gr
+import numpy as np
+def encode_text_to_audio(text, protocol_id=1, volume=20):
+    """
+    Encode text to audio waveform using ggwave
+    Args:
+        text: Text to encode
+        protocol_id: ggwave protocol (0-8, default 1)
+        volume: Audio volume (0-100, default 20)
+    Returns:
+        Tuple of (sample_rate, audio_data) for Gradio audio output
+    """
+    if not text:
+        return None
+    try:
+        waveform = ggwave.encode(text, protocolId=protocol_id, volume=volume)
+        audio_data = np.frombuffer(waveform, dtype=np.float32)
+        return 48000, audio_data
+    except Exception as e:
+        raise gr.Error(f"Encoding failed: {str(e)}")
+def decode_audio_to_text(audio_data):
+    """
+    Decode audio waveform to text using ggwave
+    Args:
+        audio_data: Tuple of (sample_rate, audio_array) from Gradio
+    Returns:
+        Decoded text string
+    """
+    if audio_data is None:
+        return "No audio provided"
+    try:
+        sample_rate, audio = audio_data
+        if audio.dtype != np.float32:
+            audio = audio.astype(np.float32)
+        if sample_rate != 48000:
+            duration = len(audio) / sample_rate
+            new_length = int(duration * 48000)
+            audio = np.interp(
+                np.linspace(0, len(audio), new_length), np.arange(len(audio)), audio
+            )
+        instance = ggwave.init()
+        chunk_size = 1024
+        decoded_text = ""
+        for i in range(0, len(audio), chunk_size):
+            chunk = audio[i : i + chunk_size]
+            chunk_bytes = chunk.tobytes()
+            res = ggwave.decode(instance, chunk_bytes)
+            if res is not None:
+                try:
+                    decoded_text = res.decode("utf-8")
+                    break
+                except:
+                    pass
+        ggwave.free(instance)
+        if decoded_text:
+            return f"✅ Decoded: {decoded_text}"
+        else:
+            return "❌ No ggwave signal detected in audio"
+    except Exception as e:
+        return f"❌ Decoding failed: {str(e)}"
+encode_interface = gr.Interface(
+    fn=encode_text_to_audio,
+    inputs=[
+        gr.Textbox(
+            label="Text to Encode",
+            placeholder="Enter text to convert to audio...",
+            lines=3,
+        ),
+        gr.Slider(
+            minimum=0,
+            maximum=8,
+            value=1,
+            step=1,
+            label="Protocol ID",
+            info="ggwave protocol (0-8, affects speed/reliability)",
+        ),
+        gr.Slider(
+            minimum=0,
+            maximum=100,
+            value=20,
+            step=1,
+            label="Volume",
+            info="Audio volume (0-100)",
+        ),
+    ],
+    outputs=gr.Audio(label="Generated Audio", type="numpy"),
+    title="📤 Encode Text to Audio",
+    description="Convert text into an audio signal using ggwave protocol",
+    examples=[
+        ["Hello World", 1, 20],
+        ["GGWave is cool!", 1, 30],
+        ["Testing 123", 2, 25],
+    ],
+    theme="default",
+)
+decode_interface = gr.Interface(
+    fn=decode_audio_to_text,
+    inputs=gr.Audio(
+        label="Upload Audio File", type="numpy", sources=["upload", "microphone"]
+    ),
+    outputs=gr.Textbox(label="Decoded Text", lines=5),
+    title="📥 Decode Audio to Text",
+    description="Extract text from an audio signal using ggwave protocol",
+    theme="default",
+)
+demo = gr.TabbedInterface(
+    [encode_interface, decode_interface],
+    tab_names=["📤 Encode", "📥 Decode"],
+    title="🎵 GGWave Audio Encoder/Decoder",
+)
+demo.launch(debug=True, mcp_server=True)

audio.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b5312c493329500cc6e4ec86eae210ca745a2daeaf1933e4fb41f4d529763736
+size 139308

requirements.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+ggwave @ git+https://github.com/not-lain/ggwave.git@python#subdirectory=bindings/python
+gradio
+pyaudio