Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -1,446 +1,90 @@
|
|
| 1 |
-
import gradio as gr
|
| 2 |
-
from openai import OpenAI
|
| 3 |
-
import requests
|
| 4 |
-
import json
|
| 5 |
-
# from volcenginesdkarkruntime import Ark
|
| 6 |
import torch
|
| 7 |
-
import
|
| 8 |
-
from einops import rearrange
|
| 9 |
-
import argparse
|
| 10 |
-
import json
|
| 11 |
-
import os
|
| 12 |
-
import spaces
|
| 13 |
-
from tqdm import tqdm
|
| 14 |
import random
|
| 15 |
-
import
|
| 16 |
-
|
| 17 |
-
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
-
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
|
| 26 |
-
from diffrhythm.infer.
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
-
|
| 37 |
-
|
| 38 |
-
|
| 39 |
-
|
| 40 |
-
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
|
| 44 |
-
|
| 45 |
-
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
|
| 50 |
-
|
| 51 |
-
raise gr.Error(f"Error: {str(e)}")
|
| 52 |
-
negative_style_prompt = get_negative_style_prompt(device)
|
| 53 |
-
latent_prompt, pred_frames = get_reference_latent(device, max_frames, edit, edit_segments, ref_audio_path, vae)
|
| 54 |
-
|
| 55 |
-
if preference_infer == "quality first":
|
| 56 |
-
batch_infer_num = 5
|
| 57 |
-
else:
|
| 58 |
-
batch_infer_num = 1
|
| 59 |
-
generated_song = inference(cfm_model=cfm,
|
| 60 |
-
vae_model=vae,
|
| 61 |
-
eval_model=eval_model,
|
| 62 |
-
eval_muq=eval_muq,
|
| 63 |
-
cond=latent_prompt,
|
| 64 |
-
text=lrc_prompt,
|
| 65 |
-
duration=end_frame,
|
| 66 |
-
style_prompt=style_prompt,
|
| 67 |
-
negative_style_prompt=negative_style_prompt,
|
| 68 |
-
steps=steps,
|
| 69 |
-
cfg_strength=cfg_strength,
|
| 70 |
-
sway_sampling_coef=sway_sampling_coef,
|
| 71 |
-
start_time=start_time,
|
| 72 |
-
file_type=file_type,
|
| 73 |
-
vocal_flag=vocal_flag,
|
| 74 |
-
odeint_method=odeint_method,
|
| 75 |
-
pred_frames=pred_frames,
|
| 76 |
-
batch_infer_num=batch_infer_num,
|
| 77 |
-
song_duration=song_duration
|
| 78 |
-
)
|
| 79 |
-
return generated_song
|
| 80 |
-
|
| 81 |
-
def R1_infer1(theme, tags_gen, language):
|
| 82 |
try:
|
| 83 |
-
|
| 84 |
-
|
| 85 |
-
|
| 86 |
-
|
| 87 |
-
|
| 88 |
-
|
| 89 |
-
|
| 90 |
-
|
| 91 |
-
|
| 92 |
-
|
| 93 |
-
|
| 94 |
-
|
| 95 |
-
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
- 错误:[01:30.00](钢琴间奏)
|
| 100 |
-
- 错误:[02:00.00][副歌]
|
| 101 |
-
- 错误:空行、换行符、注释
|
| 102 |
-
"""
|
| 103 |
-
|
| 104 |
-
response = client.chat.completions.create(
|
| 105 |
-
model="ep-20250304144033-nr9wl",
|
| 106 |
-
messages=[
|
| 107 |
-
{"role": "system", "content": "You are a professional musician who has been invited to make music-related comments."},
|
| 108 |
-
{"role": "user", "content": llm_prompt.format(theme=theme, tags=tags_gen, language=language)},
|
| 109 |
-
],
|
| 110 |
-
stream=False
|
| 111 |
)
|
| 112 |
-
|
| 113 |
-
info = response.choices[0].message.content
|
| 114 |
-
|
| 115 |
-
return info
|
| 116 |
|
| 117 |
-
|
| 118 |
-
print(f'请求出错: {e}')
|
| 119 |
-
return {}
|
| 120 |
|
|
|
|
|
|
|
| 121 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 122 |
|
| 123 |
-
|
| 124 |
-
|
| 125 |
-
|
| 126 |
-
llm_prompt = """
|
| 127 |
-
{lyrics_input}这是一首歌的歌词,每一行是一句歌词,{tags_lyrics}是我希望这首歌的风格,我现在想要给这首歌的每一句歌词打时间戳得到LRC,我希望时间戳分配应根据歌曲的标签、歌词的情感、节奏来合理推测,而非机械地按照歌词长度分配。第一句歌词的时间戳应考虑前奏长度,避免歌词从 `[00:00.00]` 直接开始。严格按照 LRC 格式输出歌词,每行格式为 `[mm:ss.xx]歌词内容`。最后的结果只输出LRC,不需要其他的解释。
|
| 128 |
-
"""
|
| 129 |
-
|
| 130 |
-
response = client.chat.completions.create(
|
| 131 |
-
model="ep-20250304144033-nr9wl",
|
| 132 |
-
messages=[
|
| 133 |
-
{"role": "system", "content": "You are a professional musician who has been invited to make music-related comments."},
|
| 134 |
-
{"role": "user", "content": llm_prompt.format(lyrics_input=lyrics_input, tags_lyrics=tags_lyrics)},
|
| 135 |
-
],
|
| 136 |
-
stream=False
|
| 137 |
-
)
|
| 138 |
-
|
| 139 |
-
info = response.choices[0].message.content
|
| 140 |
-
|
| 141 |
-
return info
|
| 142 |
-
|
| 143 |
-
css = """
|
| 144 |
-
/* 固定文本域高度并强制滚动条 */
|
| 145 |
-
.lyrics-scroll-box textarea {
|
| 146 |
-
height: 405px !important; /* 固定高度 */
|
| 147 |
-
max-height: 500px !important; /* 最大高度 */
|
| 148 |
-
overflow-y: auto !important; /* 垂直滚动 */
|
| 149 |
-
white-space: pre-wrap; /* 保留换行 */
|
| 150 |
-
line-height: 1.5; /* 行高优化 */
|
| 151 |
-
}
|
| 152 |
-
|
| 153 |
-
.gr-examples {
|
| 154 |
-
background: transparent !important;
|
| 155 |
-
border: 1px solid #e0e0e0 !important;
|
| 156 |
-
border-radius: 8px;
|
| 157 |
-
margin: 1rem 0 !important;
|
| 158 |
-
padding: 1rem !important;
|
| 159 |
-
}
|
| 160 |
-
|
| 161 |
-
"""
|
| 162 |
-
|
| 163 |
|
| 164 |
-
with gr.
|
| 165 |
-
|
| 166 |
-
<div style="display: flex; align-items: center;">
|
| 167 |
-
<img src='https://raw.githubusercontent.com/ASLP-lab/DiffRhythm/refs/heads/main/src/DiffRhythm_logo.jpg'
|
| 168 |
-
style='width: 200px; height: 40%; display: block; margin: 0 auto 20px;'>
|
| 169 |
-
</div>
|
| 170 |
-
|
| 171 |
-
<div style="flex: 1; text-align: center;">
|
| 172 |
-
<div style="font-size: 2em; font-weight: bold; text-align: center; margin-bottom: 5px">
|
| 173 |
-
Di♪♪Rhythm (谛韵)
|
| 174 |
-
</div>
|
| 175 |
-
<div style="display:flex; justify-content: center; column-gap:4px;">
|
| 176 |
-
<a href="https://arxiv.org/abs/2503.01183">
|
| 177 |
-
<img src='https://img.shields.io/badge/Arxiv-Paper-blue'>
|
| 178 |
-
</a>
|
| 179 |
-
<a href="https://github.com/ASLP-lab/DiffRhythm">
|
| 180 |
-
<img src='https://img.shields.io/badge/GitHub-Repo-green'>
|
| 181 |
-
</a>
|
| 182 |
-
<a href="https://aslp-lab.github.io/DiffRhythm.github.io/">
|
| 183 |
-
<img src='https://img.shields.io/badge/Project-Page-brown'>
|
| 184 |
-
</a>
|
| 185 |
-
</div>
|
| 186 |
-
</div>
|
| 187 |
-
""")
|
| 188 |
|
| 189 |
-
with gr.
|
| 190 |
-
|
| 191 |
-
|
| 192 |
-
|
| 193 |
-
with gr.Row():
|
| 194 |
-
with gr.Column():
|
| 195 |
-
lrc = gr.Textbox(
|
| 196 |
-
label="Lyrics",
|
| 197 |
-
placeholder="Input the full lyrics",
|
| 198 |
-
lines=12,
|
| 199 |
-
max_lines=50,
|
| 200 |
-
elem_classes="lyrics-scroll-box",
|
| 201 |
-
value="""[00:04.074] Tell me that I'm special\n[00:06.226] Tell me I look pretty\n[00:08.175] Tell me I'm a little angel\n[00:10.175] Sweetheart of your city\n[00:13.307] Say what I'm dying to hear\n[00:17.058] 'Cause I'm dying to hear you\n[00:20.523] Tell me I'm that new thing\n[00:22.571] Tell me that I'm relevant\n[00:24.723] Tell me that I got a big heart\n[00:26.723] Then back it up with evidence\n[00:29.408] I need it and I don't know why\n[00:33.907] This late at night\n[00:36.139] Isn't it lonely\n[00:38.991] I'd do anything to make you want me\n[00:43.222] I'd give it all up if you told me\n[00:47.339] That I'd be\n[00:49.157] The number one girl in your eyes\n[00:52.506] Your one and only\n[00:55.437] So what's it gon' take for you to want me\n[00:59.589] I'd give it all up if you told me\n[01:03.674] That I'd be\n[01:05.823] The number one girl in your eyes\n[01:10.841] Tell me I'm going real big places\n[01:14.055] Down to earth, so friendly\n[01:16.105] And even through all the phases\n[01:18.256] Tell me you accept me\n[01:21.155] Well, that's all I'm dying to hear\n[01:24.937] Yeah, I'm dying to hear you\n[01:28.521] Tell me that you need me\n[01:30.437] Tell me that I'm loved\n[01:32.740] Tell me that I'm worth it\n[01:34.605] And that I'm enough\n[01:37.571] I need it and I don't know why\n[01:41.889] This late at night\n[01:43.805] Isn't it lonely\n[01:46.871] I'd do anything to make you want me\n[01:51.004] I'd give it all up if you told me\n[01:55.237] That I'd be\n[01:57.089] The number one girl in your eyes\n[02:00.325] Your one and only\n[02:03.305] So what's it gon' take for you to want me\n[02:07.355] I'd give it all up if you told me\n[02:11.589] That I'd be\n[02:13.623] The number one girl in your eyes\n[02:16.804] The girl in your eyes\n[02:20.823] The girl in your eyes\n[02:26.055] Tell me I'm the number one girl\n[02:28.355] I'm the number one girl in your eyes\n[02:33.172] The girl in your eyes\n[02:37.321] The girl in your eyes\n[02:42.472] Tell me I'm the number one girl\n[02:44.539] I'm the number one girl in your eyes\n[02:49.605] Well isn't it lonely\n[02:52.488] I'd do anything to make you want me\n[02:56.637] I'd give it all up if you told me\n[03:00.888] That I'd be\n[03:03.172] The number one girl in your eyes\n[03:06.272] Your one and only\n[03:09.160] So what's it gon' take for you to want me\n[03:13.056] I'd give it all up if you told me\n[03:17.305] That I'd be\n[03:19.488] The number one girl in your eyes\n[03:25.420] The number one girl in your eyes\n"""
|
| 202 |
-
)
|
| 203 |
-
|
| 204 |
-
current_prompt_type = gr.State(value="audio")
|
| 205 |
-
with gr.Tabs() as inside_tabs:
|
| 206 |
-
with gr.Tab("Audio Prompt"):
|
| 207 |
-
audio_prompt = gr.Audio(label="Audio Prompt", type="filepath", value="./src/prompt/default.wav")
|
| 208 |
-
with gr.Tab("Text Prompt"):
|
| 209 |
-
text_prompt = gr.Textbox(
|
| 210 |
-
label="Text Prompt",
|
| 211 |
-
placeholder="Enter the Text Prompt, eg: emotional piano pop",
|
| 212 |
-
)
|
| 213 |
-
def update_prompt_type(evt: gr.SelectData):
|
| 214 |
-
return "audio" if evt.index == 0 else "text"
|
| 215 |
-
|
| 216 |
-
inside_tabs.select(
|
| 217 |
-
fn=update_prompt_type,
|
| 218 |
-
outputs=current_prompt_type
|
| 219 |
-
)
|
| 220 |
-
|
| 221 |
-
with gr.Column():
|
| 222 |
-
with gr.Accordion("Best Practices Guide", open=True):
|
| 223 |
-
gr.Markdown("""
|
| 224 |
-
1. **Lyrics Format Requirements**
|
| 225 |
-
- Each line must follow: `[mm:ss.xx]Lyric content`
|
| 226 |
-
- Example of valid format:
|
| 227 |
-
```
|
| 228 |
-
[00:10.00]Moonlight spills through broken blinds
|
| 229 |
-
[00:13.20]Your shadow dances on the dashboard shrine
|
| 230 |
-
```
|
| 231 |
-
|
| 232 |
-
2. **Generation Duration Limits**
|
| 233 |
-
- The generated music must be between **95 seconds (1:35)** and **285 seconds (4:45)** in length
|
| 234 |
-
- The latest valid lyric timestamp cannot exceed **04:45.00 (285s)**
|
| 235 |
-
|
| 236 |
-
3. **Audio Prompt Requirements**
|
| 237 |
-
- Reference audio should be ≥ 1 second, Audio >10 seconds will be randomly clipped into 10 seconds
|
| 238 |
-
- For optimal results, the 10-second clips should be carefully selected
|
| 239 |
-
- Shorter clips may lead to incoherent generation
|
| 240 |
-
|
| 241 |
-
4. **Supported Languages**
|
| 242 |
-
- Chinese and English
|
| 243 |
-
- More languages comming soon
|
| 244 |
-
|
| 245 |
-
5. **Others**
|
| 246 |
-
- If loading audio result is slow, you can select Output Format as mp3 in Advanced Settings.
|
| 247 |
-
""")
|
| 248 |
-
# Music_Duration = gr.Radio(["95s", "285s"], label="Music Duration", value="95s")
|
| 249 |
-
Music_Duration = gr.Slider(
|
| 250 |
-
minimum=95,
|
| 251 |
-
maximum=285,
|
| 252 |
-
step=1,
|
| 253 |
-
value=95,
|
| 254 |
-
label="Music Duration (s)",
|
| 255 |
-
interactive=True
|
| 256 |
-
)
|
| 257 |
-
preference_infer = gr.Radio(["quality first", "speed first"], label="Preference", value="quality first")
|
| 258 |
-
lyrics_btn = gr.Button("Generate", variant="primary")
|
| 259 |
-
audio_output = gr.Audio(label="Audio Result", type="filepath", elem_id="audio_output")
|
| 260 |
-
with gr.Accordion("Advanced Settings", open=False):
|
| 261 |
-
seed = gr.Slider(
|
| 262 |
-
label="Seed",
|
| 263 |
-
minimum=0,
|
| 264 |
-
maximum=MAX_SEED,
|
| 265 |
-
step=1,
|
| 266 |
-
value=0,
|
| 267 |
-
)
|
| 268 |
-
randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
|
| 269 |
-
|
| 270 |
-
steps = gr.Slider(
|
| 271 |
-
minimum=10,
|
| 272 |
-
maximum=100,
|
| 273 |
-
value=32,
|
| 274 |
-
step=1,
|
| 275 |
-
label="Diffusion Steps",
|
| 276 |
-
interactive=True,
|
| 277 |
-
elem_id="step_slider"
|
| 278 |
-
)
|
| 279 |
-
cfg_strength = gr.Slider(
|
| 280 |
-
minimum=1,
|
| 281 |
-
maximum=10,
|
| 282 |
-
value=4.0,
|
| 283 |
-
step=0.5,
|
| 284 |
-
label="CFG Strength",
|
| 285 |
-
interactive=True,
|
| 286 |
-
elem_id="step_slider"
|
| 287 |
-
)
|
| 288 |
-
# edit = gr.Checkbox(label="edit", value=False)
|
| 289 |
-
# edit = False
|
| 290 |
-
# preference_infer = gr.Radio(["quality first", "speed first"], label="Preference", value="quality first")
|
| 291 |
-
# edit_segments = gr.Textbox(
|
| 292 |
-
# label="Edit Segments",
|
| 293 |
-
# placeholder="Time segments to edit (in seconds). Format: `[[start1,end1],...]",
|
| 294 |
-
# )
|
| 295 |
-
|
| 296 |
-
odeint_method = gr.Radio(["euler", "midpoint", "rk4","implicit_adams"], label="ODE Solver", value="euler")
|
| 297 |
-
file_type = gr.Dropdown(["wav", "mp3", "ogg"], label="Output Format", value="mp3")
|
| 298 |
-
|
| 299 |
-
|
| 300 |
-
gr.Examples(
|
| 301 |
-
examples=[
|
| 302 |
-
["./src/prompt/pop_cn.wav"],
|
| 303 |
-
["./src/prompt/pop_en.wav"],
|
| 304 |
-
["./src/prompt/rock_cn.wav"],
|
| 305 |
-
["./src/prompt/rock_en.wav"],
|
| 306 |
-
["./src/prompt/country_cn.wav"],
|
| 307 |
-
["./src/prompt/country_en.wav"],
|
| 308 |
-
["./src/prompt/classic_cn.wav"],
|
| 309 |
-
["./src/prompt/classic_en.wav"],
|
| 310 |
-
["./src/prompt/jazz_cn.wav"],
|
| 311 |
-
["./src/prompt/jazz_en.wav"],
|
| 312 |
-
["./src/prompt/rap_cn.wav"],
|
| 313 |
-
["./src/prompt/rap_en.wav"],
|
| 314 |
-
["./src/prompt/default.wav"]
|
| 315 |
-
],
|
| 316 |
-
inputs=[audio_prompt],
|
| 317 |
-
label="Audio Examples",
|
| 318 |
-
examples_per_page=13,
|
| 319 |
-
elem_id="audio-examples-container"
|
| 320 |
-
)
|
| 321 |
-
|
| 322 |
-
gr.Examples(
|
| 323 |
-
examples=[
|
| 324 |
-
["Pop Emotional Piano"],
|
| 325 |
-
["流行 情感 钢琴"],
|
| 326 |
-
["Indie folk ballad, coming-of-age themes, acoustic guitar picking with harmonica interludes"],
|
| 327 |
-
["独立民谣, 成长主题, 原声吉他弹奏与口琴间奏"]
|
| 328 |
-
],
|
| 329 |
-
inputs=[text_prompt],
|
| 330 |
-
label="Text Examples",
|
| 331 |
-
examples_per_page=4,
|
| 332 |
-
elem_id="text-examples-container"
|
| 333 |
-
)
|
| 334 |
|
| 335 |
-
|
| 336 |
-
examples=[
|
| 337 |
-
["""[00:04.074] Tell me that I'm special\n[00:06.226] Tell me I look pretty\n[00:08.175] Tell me I'm a little angel\n[00:10.175] Sweetheart of your city\n[00:13.307] Say what I'm dying to hear\n[00:17.058] 'Cause I'm dying to hear you\n[00:20.523] Tell me I'm that new thing\n[00:22.571] Tell me that I'm relevant\n[00:24.723] Tell me that I got a big heart\n[00:26.723] Then back it up with evidence\n[00:29.408] I need it and I don't know why\n[00:33.907] This late at night\n[00:36.139] Isn't it lonely\n[00:38.991] I'd do anything to make you want me\n[00:43.222] I'd give it all up if you told me\n[00:47.339] That I'd be\n[00:49.157] The number one girl in your eyes\n[00:52.506] Your one and only\n[00:55.437] So what's it gon' take for you to want me\n[00:59.589] I'd give it all up if you told me\n[01:03.674] That I'd be\n[01:05.823] The number one girl in your eyes\n[01:10.841] Tell me I'm going real big places\n[01:14.055] Down to earth, so friendly\n[01:16.105] And even through all the phases\n[01:18.256] Tell me you accept me\n[01:21.155] Well, that's all I'm dying to hear\n[01:24.937] Yeah, I'm dying to hear you\n[01:28.521] Tell me that you need me\n[01:30.437] Tell me that I'm loved\n[01:32.740] Tell me that I'm worth it\n[01:34.605] And that I'm enough\n[01:37.571] I need it and I don't know why\n[01:41.889] This late at night\n[01:43.805] Isn't it lonely\n[01:46.871] I'd do anything to make you want me\n[01:51.004] I'd give it all up if you told me\n[01:55.237] That I'd be\n[01:57.089] The number one girl in your eyes\n[02:00.325] Your one and only\n[02:03.305] So what's it gon' take for you to want me\n[02:07.355] I'd give it all up if you told me\n[02:11.589] That I'd be\n[02:13.623] The number one girl in your eyes\n[02:16.804] The girl in your eyes\n[02:20.823] The girl in your eyes\n[02:26.055] Tell me I'm the number one girl\n[02:28.355] I'm the number one girl in your eyes\n[02:33.172] The girl in your eyes\n[02:37.321] The girl in your eyes\n[02:42.472] Tell me I'm the number one girl\n[02:44.539] I'm the number one girl in your eyes\n[02:49.605] Well isn't it lonely\n[02:52.488] I'd do anything to make you want me\n[02:56.637] I'd give it all up if you told me\n[03:00.888] That I'd be\n[03:03.172] The number one girl in your eyes\n[03:06.272] Your one and only\n[03:09.160] So what's it gon' take for you to want me\n[03:13.056] I'd give it all up if you told me\n[03:17.305] That I'd be\n[03:19.488] The number one girl in your eyes\n[03:25.420] The number one girl in your eyes\n"""],
|
| 338 |
-
["""[00:00.133]Abracadabra, abracadabra\n[00:03.985]Abracadabra, abracadabra\n[00:15.358]Pay the toll to the angels\n[00:18.694]Drawin' circles in the clouds\n[00:22.966]Keep your mind on the distance\n[00:26.321]When the devil turns around\n[00:30.540]Hold me in your heart tonight\n[00:33.751]In the magic of the dark moonlight\n[00:38.189]Save me from this empty fight\n[00:43.521]In the game of life\n[00:45.409]Like a poem said by a lady in red\n[00:49.088]You hear the last few words of your life\n[00:53.013]With a haunting dance, now you're both in a trance\n[00:56.687]It's time to cast your spell on the night\n[01:01.131]Abracadabra amor-oo-na-na\n[01:04.394]Abracadabra morta-oo-gaga\n[01:08.778]Abracadabra, abra-ooh-na-na\n[01:12.063]In her tongue, she's sayin'\n[01:14.367]Death or love tonight\n[01:18.249]Abracadabra, abracadabra\n[01:22.136]Abracadabra, abracadabra\n[01:25.859]Feel the beat under your feet\n[01:27.554]The floor's on fire\n[01:29.714]Abracadabra, abracadabra\n[01:33.464]Choose the road on the west side\n[01:36.818]As the dust flies, watch it burn\n[01:41.057]Don't waste time on feeling\n[01:44.419]Use your passion no return\n[01:48.724]Hold me in your heart tonight\n[01:51.886]In the magic of the dark moonlight\n[01:56.270]Save me from this empty fight\n[02:01.599]In the game of life\n[02:03.524]Like a poem said by a lady in red\n[02:07.192]You hear the last few words of your life\n[02:11.055]With a haunting dance, now you're both in a trance\n[02:14.786]It's time to cast your spell on the night\n[02:19.225]Abracadabra amor-oo-na-na\n[02:22.553]Abracadabra morta-oo-gaga\n[02:26.852]Abracadabra, abra-ooh-na-na\n[02:30.110]In her tongue, she's sayin'\n[02:32.494]Death or love tonight\n[02:36.244]Abracadabra, abracadabra\n[02:40.161]Abracadabra, abracadabra\n[02:43.966]Feel the beat under your feet\n[02:45.630]The floor's on fire\n[02:47.812]Abracadabra, abracadabra\n[02:50.537]Phantom of the dancefloor, come to me\n[02:58.169]Sing for me a sinful melody\n[03:05.833]Ah-ah-ah-ah-ah, ah-ah, ah-ah\n[03:13.453]Ah-ah-ah-ah-ah, ah-ah, ah-ah\n[03:22.025]Abracadabra amor-oo-na-na\n[03:25.423]Abracadabra morta-oo-gaga\n[03:29.674]Abracadabra, abra-ooh-na-na\n[03:33.013]In her tongue, she's sayin'\n[03:35.401]Death or love tonight\n"""],
|
| 339 |
-
["""[00:00.27]只��你太美 baby 只因你太美 baby\n[00:08.95]只因你实在是太美 baby\n[00:13.99]只因你太美 baby\n[00:18.89]迎面走来的你让我如此蠢蠢欲动\n[00:20.88]这种感觉我从未有\n[00:21.79]Cause I got a crush on you who you\n[00:25.74]你是我的我是你的谁\n[00:28.09]再多一眼看一眼就会爆炸\n[00:30.31]再近一点靠近点快被融化\n[00:32.49]想要把你占为己有 baby bae\n[00:34.60]不管走到哪里\n[00:35.44]都会想起的人是你 you you\n[00:38.12]我应该拿你怎样\n[00:39.61]Uh 所有人都在看着你\n[00:42.36]我的心总是不安\n[00:44.18]Oh 我现在已病入膏肓\n[00:46.63]Eh oh\n[00:47.84]难道真的因你而疯狂吗\n[00:51.57]我本来不是这种人\n[00:53.59]因你变成奇怪的人\n[00:55.77]第一次呀变成这样的我\n[01:01.23]不管我怎么去否认\n[01:03.21]只因你太美 baby 只因你太美 baby\n[01:11.46]只因你实在是太美 baby\n[01:16.75]只因你太美 baby\n[01:21.09]Oh eh oh\n[01:22.82]现在确认地告诉我\n[01:25.26]Oh eh oh\n[01:27.31]你到底属于谁\n[01:29.98]Oh eh oh\n[01:31.70]现在确认地告诉我\n[01:34.45]Oh eh oh\n"""],
|
| 340 |
-
["""[00:19.50]也想不到要怎么问你别来无恙\n[00:25.71]世界乱的一塌糊涂可是能怎样\n[00:31.85]偶尔抬起头来还好有颗月亮可赏\n[00:38.96]太多回忆要我怎么摆进行李箱\n[00:45.22]一直没哭一直走路走灰多少太阳\n[00:51.70]因为往事没有办法悬赏 隐形在那大街小巷\n[01:00.22]剪断了它还嚣张\n[01:03.85]我的嘴在说谎 说的那么漂亮\n[01:10.07]说我早就忘了你像月一样的俏脸庞\n[01:16.51]最怕一边忙呀忙一边回想那旧时光\n[01:22.87]剪不掉的是你 带泪的脸 还真是烦\n[01:43.32]多少原因将我绑在半夜屋顶上\n[01:49.23]一直没再爱一个人如今就是这样\n[01:55.75]因为故事跟你说了一半 于是搁在所谓云端\n[02:04.21]谁忘不了谁孤单\n[02:07.79]我的心在说谎 说下去会疯狂\n[02:14.02]如果没有月亮那些日子都无妨\n[02:20.43]最怕一边忙呀忙一边想那旧时光\n[02:26.91]剪不掉的是你 带笑的苦 还真烦\n[02:33.81]我的嘴又说了谎 说的那么漂亮\n[02:39.68]以为已经忘了你的那些美像月光它剪不断\n[02:47.15]因为爱早就钻进心脏 心一跳泪就会烫\n[02:52.22]那些带泪的脸 带笑的苦 还真烦\n[02:59.28]月亮是个凶手 想你的我 是通缉犯\n[03:08.03]我有时候真的很怕望见那月光中的你\n"""]
|
| 341 |
-
],
|
| 342 |
-
|
| 343 |
-
inputs=[lrc],
|
| 344 |
-
label="Lrc Examples",
|
| 345 |
-
examples_per_page=4,
|
| 346 |
-
elem_id="lrc-examples-container",
|
| 347 |
-
)
|
| 348 |
|
|
|
|
| 349 |
|
| 350 |
-
|
| 351 |
-
|
| 352 |
-
|
| 353 |
-
|
| 354 |
-
with gr.Accordion("Notice", open=False):
|
| 355 |
-
gr.Markdown("**Two Generation Modes:**\n1. Generate from theme & tags\n2. Add timestamps to existing lyrics")
|
| 356 |
-
|
| 357 |
-
with gr.Group():
|
| 358 |
-
gr.Markdown("### Method 1: Generate from Theme")
|
| 359 |
-
theme = gr.Textbox(label="theme", placeholder="Enter song theme, e.g: Love and Heartbreak")
|
| 360 |
-
tags_gen = gr.Textbox(label="tags", placeholder="Enter song tags, e.g: pop confidence healing")
|
| 361 |
-
language = gr.Radio(["cn", "en"], label="Language", value="en")
|
| 362 |
-
gen_from_theme_btn = gr.Button("Generate LRC (From Theme)", variant="primary")
|
| 363 |
-
|
| 364 |
-
gr.Examples(
|
| 365 |
-
examples=[
|
| 366 |
-
[
|
| 367 |
-
"Love and Heartbreak",
|
| 368 |
-
"vocal emotional piano pop",
|
| 369 |
-
"en"
|
| 370 |
-
],
|
| 371 |
-
[
|
| 372 |
-
"Heroic Epic",
|
| 373 |
-
"choir orchestral powerful",
|
| 374 |
-
"cn"
|
| 375 |
-
]
|
| 376 |
-
],
|
| 377 |
-
inputs=[theme, tags_gen, language],
|
| 378 |
-
label="Examples: Generate from Theme"
|
| 379 |
-
)
|
| 380 |
-
|
| 381 |
-
with gr.Group(visible=True):
|
| 382 |
-
gr.Markdown("### Method 2: Add Timestamps to Lyrics")
|
| 383 |
-
tags_lyrics = gr.Textbox(label="tags", placeholder="Enter song tags, e.g: ballad piano slow")
|
| 384 |
-
lyrics_input = gr.Textbox(
|
| 385 |
-
label="Raw Lyrics (without timestamps)",
|
| 386 |
-
placeholder="Enter plain lyrics (without timestamps), e.g:\nYesterday\nAll my troubles...",
|
| 387 |
-
lines=10,
|
| 388 |
-
max_lines=50,
|
| 389 |
-
elem_classes="lyrics-scroll-box"
|
| 390 |
-
)
|
| 391 |
-
|
| 392 |
-
gen_from_lyrics_btn = gr.Button("Generate LRC (From Lyrics)", variant="primary")
|
| 393 |
-
|
| 394 |
-
gr.Examples(
|
| 395 |
-
examples=[
|
| 396 |
-
[
|
| 397 |
-
"acoustic folk happy",
|
| 398 |
-
"""I'm sitting here in the boring room\nIt's just another rainy Sunday afternoon"""
|
| 399 |
-
],
|
| 400 |
-
[
|
| 401 |
-
"electronic dance energetic",
|
| 402 |
-
"""We're living in a material world\nAnd I am a material girl"""
|
| 403 |
-
]
|
| 404 |
-
],
|
| 405 |
-
inputs=[tags_lyrics, lyrics_input],
|
| 406 |
-
label="Examples: Generate from Lyrics"
|
| 407 |
-
)
|
| 408 |
-
|
| 409 |
-
|
| 410 |
-
with gr.Column():
|
| 411 |
-
lrc_output = gr.Textbox(
|
| 412 |
-
label="Generated LRC",
|
| 413 |
-
placeholder="Timed lyrics will appear here",
|
| 414 |
-
lines=57,
|
| 415 |
-
elem_classes="lrc-output",
|
| 416 |
-
show_copy_button=True
|
| 417 |
-
)
|
| 418 |
-
|
| 419 |
-
# Bind functions
|
| 420 |
-
gen_from_theme_btn.click(
|
| 421 |
-
fn=R1_infer1,
|
| 422 |
-
inputs=[theme, tags_gen, language],
|
| 423 |
-
outputs=lrc_output
|
| 424 |
-
)
|
| 425 |
-
|
| 426 |
-
gen_from_lyrics_btn.click(
|
| 427 |
-
fn=R1_infer2,
|
| 428 |
-
inputs=[tags_lyrics, lyrics_input],
|
| 429 |
-
outputs=lrc_output
|
| 430 |
-
)
|
| 431 |
-
|
| 432 |
-
tabs.select(
|
| 433 |
-
lambda s: None,
|
| 434 |
-
None,
|
| 435 |
-
None
|
| 436 |
-
)
|
| 437 |
-
|
| 438 |
-
lyrics_btn.click(
|
| 439 |
-
fn=infer_music,
|
| 440 |
-
inputs=[lrc, audio_prompt, text_prompt, current_prompt_type, seed, randomize_seed, steps, cfg_strength, file_type, odeint_method, preference_infer, Music_Duration],
|
| 441 |
-
outputs=audio_output
|
| 442 |
)
|
| 443 |
|
| 444 |
-
|
| 445 |
-
if __name__ == "__main__":
|
| 446 |
-
demo.launch()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
import torch
|
| 2 |
+
import gradio as gr
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3 |
import random
|
| 4 |
+
import traceback
|
| 5 |
+
|
| 6 |
+
# -------------------------------------------------
|
| 7 |
+
# FORCE CPU (FREE TIER SAFE)
|
| 8 |
+
# -------------------------------------------------
|
| 9 |
+
device = "cpu"
|
| 10 |
+
print("Running in CPU mode (Free tier safe)")
|
| 11 |
+
|
| 12 |
+
# -------------------------------------------------
|
| 13 |
+
# IMPORT YOUR ORIGINAL UTILITIES
|
| 14 |
+
# -------------------------------------------------
|
| 15 |
+
from diffrhythm.infer.infer_utils import prepare_model, infer_music
|
| 16 |
+
|
| 17 |
+
# -------------------------------------------------
|
| 18 |
+
# LOAD MODEL (REDUCED MEMORY MODE)
|
| 19 |
+
# -------------------------------------------------
|
| 20 |
+
try:
|
| 21 |
+
cfm, tokenizer, muq, vae, eval_model, eval_muq = prepare_model(
|
| 22 |
+
max_frames=2048, # Reduced from 6144
|
| 23 |
+
device=device
|
| 24 |
+
)
|
| 25 |
+
print("Model loaded successfully.")
|
| 26 |
+
except Exception as e:
|
| 27 |
+
print("Model loading failed:")
|
| 28 |
+
print(traceback.format_exc())
|
| 29 |
+
raise e
|
| 30 |
+
|
| 31 |
+
# -------------------------------------------------
|
| 32 |
+
# SAFE GENERATION FUNCTION
|
| 33 |
+
# -------------------------------------------------
|
| 34 |
+
def generate_music(
|
| 35 |
+
prompt,
|
| 36 |
+
duration,
|
| 37 |
+
guidance_scale,
|
| 38 |
+
seed
|
| 39 |
+
):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 40 |
try:
|
| 41 |
+
if seed == -1:
|
| 42 |
+
seed = random.randint(0, 999999)
|
| 43 |
+
|
| 44 |
+
torch.manual_seed(int(seed))
|
| 45 |
+
|
| 46 |
+
audio = infer_music(
|
| 47 |
+
cfm=cfm,
|
| 48 |
+
tokenizer=tokenizer,
|
| 49 |
+
muq=muq,
|
| 50 |
+
vae=vae,
|
| 51 |
+
eval_model=eval_model,
|
| 52 |
+
eval_muq=eval_muq,
|
| 53 |
+
prompt=prompt,
|
| 54 |
+
duration=int(duration),
|
| 55 |
+
guidance_scale=float(guidance_scale),
|
| 56 |
+
device=device
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 57 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 58 |
|
| 59 |
+
return audio
|
|
|
|
|
|
|
| 60 |
|
| 61 |
+
except Exception as e:
|
| 62 |
+
return f"Error during generation:\n{traceback.format_exc()}"
|
| 63 |
|
| 64 |
+
# -------------------------------------------------
|
| 65 |
+
# GRADIO UI
|
| 66 |
+
# -------------------------------------------------
|
| 67 |
+
with gr.Blocks() as demo:
|
| 68 |
|
| 69 |
+
gr.Markdown("# 🎵 DiffRhythm (CPU Safe Version)")
|
| 70 |
+
gr.Markdown("Running on Free CPU mode. Generation will be slow.")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 71 |
|
| 72 |
+
with gr.Row():
|
| 73 |
+
prompt = gr.Textbox(label="Music Prompt", placeholder="Describe the music...")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 74 |
|
| 75 |
+
with gr.Row():
|
| 76 |
+
duration = gr.Slider(5, 30, value=10, step=1, label="Duration (seconds)")
|
| 77 |
+
guidance = gr.Slider(1, 10, value=5, step=0.5, label="Guidance Scale")
|
| 78 |
+
seed = gr.Number(value=-1, label="Seed (-1 = random)")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 79 |
|
| 80 |
+
generate_btn = gr.Button("Generate Music")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 81 |
|
| 82 |
+
output_audio = gr.Audio(label="Generated Audio")
|
| 83 |
|
| 84 |
+
generate_btn.click(
|
| 85 |
+
fn=generate_music,
|
| 86 |
+
inputs=[prompt, duration, guidance, seed],
|
| 87 |
+
outputs=output_audio
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 88 |
)
|
| 89 |
|
| 90 |
+
demo.launch()
|
|
|
|
|
|