Spaces:
Runtime error
feat: Make app more informative
Browse files
app.py
CHANGED
|
@@ -157,13 +157,36 @@ def generate_caption(audio_file):
|
|
| 157 |
return outputs
|
| 158 |
|
| 159 |
|
| 160 |
-
|
| 161 |
-
|
| 162 |
-
|
| 163 |
-
|
| 164 |
-
|
| 165 |
-
|
| 166 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 167 |
|
| 168 |
if __name__ == "__main__":
|
| 169 |
demo.launch()
|
|
|
|
| 157 |
return outputs
|
| 158 |
|
| 159 |
|
| 160 |
+
with gr.Blocks(title="SonicVerse") as demo:
|
| 161 |
+
gr.Markdown("""
|
| 162 |
+
# 🎼 SonicVerse: Music Captioning Demo
|
| 163 |
+
|
| 164 |
+
Welcome to **SonicVerse**, a multi-task music captioning model that provides natural language descriptions of input clips.
|
| 165 |
+
|
| 166 |
+
🎵 Captions include music features such as:
|
| 167 |
+
- Genre
|
| 168 |
+
- Mood
|
| 169 |
+
- Instrumentation
|
| 170 |
+
- Vocals
|
| 171 |
+
- Key
|
| 172 |
+
|
| 173 |
+
📘 [Read the Paper](https://arxiv.org/abs/2506.15154)
|
| 174 |
+
|
| 175 |
+
🖥️ [Replicate locally](https://github.com/amaai-lab/SonicVerse)
|
| 176 |
+
|
| 177 |
+
|
| 178 |
+
⚠️ **Note:** You can upload audio of any length, but due to compute limits on Hugging Face Spaces,
|
| 179 |
+
it is recommended to keep clips under 30 seconds unless you have a Pro account or run this locally.
|
| 180 |
+
""")
|
| 181 |
+
|
| 182 |
+
with gr.Row():
|
| 183 |
+
audio_input = gr.Audio(type="filepath", label="Upload your music clip")
|
| 184 |
+
caption_output = gr.Textbox(label="Generated Caption", lines=8)
|
| 185 |
+
|
| 186 |
+
submit_btn = gr.Button("Generate Caption")
|
| 187 |
+
submit_btn.click(fn=caption_audio, inputs=audio_input, outputs=caption_output)
|
| 188 |
+
|
| 189 |
+
|
| 190 |
|
| 191 |
if __name__ == "__main__":
|
| 192 |
demo.launch()
|