Spaces:
Configuration error
Configuration error
Update app.py
Browse files
app.py
CHANGED
|
@@ -86,17 +86,20 @@ def generate_audio(prompt, seconds_total=10, steps=100, cfg_scale=7):
|
|
| 86 |
return unique_filename
|
| 87 |
|
| 88 |
# Setting up the Gradio Interface
|
|
|
|
|
|
|
| 89 |
interface = gr.Interface(
|
| 90 |
fn=generate_audio,
|
| 91 |
inputs=[
|
| 92 |
gr.Textbox(label="Prompt", placeholder="Enter your text prompt here"),
|
| 93 |
gr.Slider(0, 10, value=5, label="Duration in Seconds"),
|
| 94 |
-
gr.Slider(10,
|
| 95 |
gr.Slider(1, 10, value=7, step=0.1, label="CFG Scale")
|
| 96 |
],
|
| 97 |
outputs=gr.Audio(type="filepath", label="Generated Audio"),
|
| 98 |
title="Synthio Stable Audio Generator",
|
| 99 |
-
description="
|
|
|
|
| 100 |
|
| 101 |
# Launch the Interface
|
| 102 |
interface.launch()
|
|
|
|
| 86 |
return unique_filename
|
| 87 |
|
| 88 |
# Setting up the Gradio Interface
|
| 89 |
+
# Paper credited in the description text rendered under the app title.
paper_link = "https://arxiv.org/pdf/2410.02056"
paper_text = "Synthio: Augmenting Small-Scale Audio Classification Datasets with Synthetic Data"

# Input widgets are declared in the same order as the parameters of
# generate_audio(prompt, seconds_total, steps, cfg_scale); the output is the
# path of the audio file that generate_audio returns.
interface = gr.Interface(
    fn=generate_audio,
    inputs=[
        gr.Textbox(placeholder="Enter your text prompt here", label="Prompt"),
        gr.Slider(minimum=0, maximum=10, value=5, label="Duration in Seconds"),
        gr.Slider(
            minimum=10,
            maximum=250,
            value=150,
            step=10,
            label="Number of Diffusion Steps",
        ),
        gr.Slider(minimum=1, maximum=10, value=7, step=0.1, label="CFG Scale"),
    ],
    outputs=gr.Audio(label="Generated Audio", type="filepath"),
    title="Synthio Stable Audio Generator",
    # The description is HTML: two lines separated by <br>, the second one
    # linking to the paper.
    description=(
        "A text-to-audio diffusion model (based on the Stable Audio DiT architecture) for generating variable length synthetic audios from text prompts at 44.1kHz.<br>"
        "This model was developed as part of the paper: "
        f"<a href='{paper_link}'>{paper_text}</a> <br>"
    ),
)

# Launch the Interface
interface.launch()
|