Spaces:

SeaSky1027
/

AudioGAN

Build error

App Files Files Community

SeaSky1027 committed on Feb 1

Commit

1f2dc3f

1 Parent(s): a75176e

Modify requirements.txt

Browse files

Files changed (1) hide show

app.py +11 -9

app.py CHANGED Viewed

@@ -105,7 +105,7 @@ def load_model_cache():
 def generate_audio_gradio(prompt, seed):
     """Generate audio from text prompt with fixed seed (CPU)."""
     if not prompt or not prompt.strip():
-        raise gr.Error("Prompt을 입력해 주세요.")
     model_dict = load_model_cache()
@@ -150,23 +150,25 @@ input_text = gr.Textbox(lines=2, label="Prompt", placeholder="e.g. A bird is chi
 seed = gr.Number(value=42, label="Seed", minimum=0, maximum=2**32 - 1, step=1, precision=0)
 description_text = """
-### **AudioGAN**: Compact and Efficient Text-to-Audio Generation (GAN-based)
 - [📖 Paper (arXiv)](https://arxiv.org/abs/2512.22166)
 - [💻 GitHub](https://github.com/SeaSky1027/AudioGAN)
 - [🤗 Hugging Face Model](https://huggingface.co/SeaSky1027/AudioGAN)
 - [🌐 Project Page](https://seasky1027.github.io/AudioGAN/)
-이 Space는 **CPU 전용**으로 동작합니다. Prompt와 Seed를 입력한 뒤 생성 버튼을 누르면 오디오가 생성됩니다.
 """
 # Examples: Prompt and Seed only (no duration, steps, variant, etc.)
 examples_list = [
-    ["A bird is chirping in a quiet place.", 42],
-    ["Guitar and piano playing a warm music, with a soft and gentle melody.", 42],
-    ["Melodic human whistling harmonizing with natural birdsong", 123],
-    ["Chopping meat on a wooden table.", 0],
-    ["A vehicle engine revving then accelerating at a high rate.", 2024],
 ]
 gr_interface = gr.Interface(
@@ -176,7 +178,7 @@ gr_interface = gr.Interface(
         gr.Audio(label="🎵 Audio Sample", type="filepath"),
         gr.Textbox(label="Prompt Used", interactive=False),
     ],
-    title="AudioGAN: Text-to-Audio Generation",
     description=description_text,
     flagging_mode="never",
     examples=examples_list,

 def generate_audio_gradio(prompt, seed):
     """Generate audio from text prompt with fixed seed (CPU)."""
     if not prompt or not prompt.strip():
+        raise gr.Error("Enter the prompt.")
     model_dict = load_model_cache()
 seed = gr.Number(value=42, label="Seed", minimum=0, maximum=2**32 - 1, step=1, precision=0)
 description_text = """
+###
+AudioGAN is a novel GAN-based model tailored for compact and efficient text-to-audio generation.
 - [📖 Paper (arXiv)](https://arxiv.org/abs/2512.22166)
 - [💻 GitHub](https://github.com/SeaSky1027/AudioGAN)
 - [🤗 Hugging Face Model](https://huggingface.co/SeaSky1027/AudioGAN)
 - [🌐 Project Page](https://seasky1027.github.io/AudioGAN/)
+This space uses only the CPU.
+So, model inference may be slow.
+Download the code from GitHub and the weights from huggingface.
+Then, run inference on your own GPU for faster results.
 """
 # Examples: Prompt and Seed only (no duration, steps, variant, etc.)
 examples_list = [
+    ["Chopping meat on a wooden table.", 10],
+    ["A bird is chirping in a quiet place.", 27],
+    ["Melodic human whistling harmonizing with natural birdsong", 1027],
 ]
 gr_interface = gr.Interface(
         gr.Audio(label="🎵 Audio Sample", type="filepath"),
         gr.Textbox(label="Prompt Used", interactive=False),
     ],
+    title="AudioGAN: A Compact and Efficient Framework for Real-Time High-Fidelity Text-to-Audio Generation",
     description=description_text,
     flagging_mode="never",
     examples=examples_list,