Coiland commited on
Commit
07aaa94
·
verified ·
1 Parent(s): f0f1b62

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +75 -431
app.py CHANGED
@@ -1,446 +1,90 @@
1
- import gradio as gr
2
- from openai import OpenAI
3
- import requests
4
- import json
5
- # from volcenginesdkarkruntime import Ark
6
  import torch
7
- import torchaudio
8
- from einops import rearrange
9
- import argparse
10
- import json
11
- import os
12
- import spaces
13
- from tqdm import tqdm
14
  import random
15
- import numpy as np
16
- import sys
17
- import base64
18
- from diffrhythm.infer.infer_utils import (
19
- get_reference_latent,
20
- get_lrc_token,
21
- get_audio_style_prompt,
22
- get_text_style_prompt,
23
- prepare_model,
24
- get_negative_style_prompt
25
- )
26
- from diffrhythm.infer.infer import inference
27
-
28
- MAX_SEED = np.iinfo(np.int32).max
29
- device='cuda'
30
- cfm, tokenizer, muq, vae, eval_model, eval_muq = prepare_model(max_frames=6144, device=device)
31
- cfm = torch.compile(cfm)
32
-
33
- @spaces.GPU
34
- def infer_music(lrc, ref_audio_path, text_prompt, current_prompt_type, seed=42,
35
- randomize_seed=False, steps=32, cfg_strength=4.0, file_type='wav',
36
- odeint_method='euler', preference_infer="quality first", Music_Duration=285, edit=False,
37
- edit_segments=None, device='cuda'):
38
- max_frames = 2048 if Music_Duration == 95 else 6144
39
- sway_sampling_coef = -1 if steps < 32 else None
40
- if randomize_seed:
41
- seed = random.randint(0, MAX_SEED)
42
- torch.manual_seed(seed)
43
- vocal_flag = False
44
- try:
45
- lrc_prompt, start_time, end_frame, song_duration = get_lrc_token(max_frames, lrc, tokenizer, Music_Duration, device)
46
- if current_prompt_type == 'audio':
47
- style_prompt, vocal_flag = get_audio_style_prompt(muq, ref_audio_path)
48
- else:
49
- style_prompt = get_text_style_prompt(muq, text_prompt)
50
- except Exception as e:
51
- raise gr.Error(f"Error: {str(e)}")
52
- negative_style_prompt = get_negative_style_prompt(device)
53
- latent_prompt, pred_frames = get_reference_latent(device, max_frames, edit, edit_segments, ref_audio_path, vae)
54
-
55
- if preference_infer == "quality first":
56
- batch_infer_num = 5
57
- else:
58
- batch_infer_num = 1
59
- generated_song = inference(cfm_model=cfm,
60
- vae_model=vae,
61
- eval_model=eval_model,
62
- eval_muq=eval_muq,
63
- cond=latent_prompt,
64
- text=lrc_prompt,
65
- duration=end_frame,
66
- style_prompt=style_prompt,
67
- negative_style_prompt=negative_style_prompt,
68
- steps=steps,
69
- cfg_strength=cfg_strength,
70
- sway_sampling_coef=sway_sampling_coef,
71
- start_time=start_time,
72
- file_type=file_type,
73
- vocal_flag=vocal_flag,
74
- odeint_method=odeint_method,
75
- pred_frames=pred_frames,
76
- batch_infer_num=batch_infer_num,
77
- song_duration=song_duration
78
- )
79
- return generated_song
80
-
81
- def R1_infer1(theme, tags_gen, language):
82
  try:
83
- client = OpenAI(api_key=os.getenv('HS_DP_API'), base_url = "https://ark.cn-beijing.volces.com/api/v3")
84
-
85
- llm_prompt = """
86
- 请围绕"{theme}"主题生成一首符合"{tags}"风格的语言为{language}的完整歌词。严格遵循以下要求:
87
-
88
- ### **强制格式规则**
89
- 1. **仅输出时间戳和歌词**,禁止任何括号、旁白、段落标记(如副歌、间奏、尾奏等注释)。
90
- 2. 每行格式必须为 `[mm:ss.xx]歌词内容`,时间戳与歌词间无空格,歌词内容需完整连贯。
91
- 3. 时间戳需自然分布,**第一句歌词起始时间不得为 [00:00.00]**,需考虑前奏空白。
92
-
93
- ### **内容与结构要求**
94
- 1. 歌词应富���变化,使情绪递进,整体连贯有层次感。**每行歌词长度应自然变化**,切勿长度一致,导致很格式化。
95
- 2. **时间戳分配应根据歌曲的标签、歌词的情感、节奏来合理推测**,而非机械地按照歌词长度分配。
96
- 3. 间奏/尾奏仅通过时间空白体现(如从 [02:30.00] 直接跳至 [02:50.00]),**无需文字描述**。
97
-
98
- ### **负面示例(禁止出现)**
99
- - 错误:[01:30.00](钢琴间奏)
100
- - 错误:[02:00.00][副歌]
101
- - 错误:空行、换行符、注释
102
- """
103
-
104
- response = client.chat.completions.create(
105
- model="ep-20250304144033-nr9wl",
106
- messages=[
107
- {"role": "system", "content": "You are a professional musician who has been invited to make music-related comments."},
108
- {"role": "user", "content": llm_prompt.format(theme=theme, tags=tags_gen, language=language)},
109
- ],
110
- stream=False
111
  )
112
-
113
- info = response.choices[0].message.content
114
-
115
- return info
116
 
117
- except requests.exceptions.RequestException as e:
118
- print(f'请求出错: {e}')
119
- return {}
120
 
 
 
121
 
 
 
 
 
122
 
123
- def R1_infer2(tags_lyrics, lyrics_input):
124
- client = OpenAI(api_key=os.getenv('HS_DP_API'), base_url = "https://ark.cn-beijing.volces.com/api/v3")
125
-
126
- llm_prompt = """
127
- {lyrics_input}这是一首歌的歌词,每一行是一句歌词,{tags_lyrics}是我希望这首歌的风格,我现在想要给这首歌的每一句歌词打时间戳得到LRC,我希望时间戳分配应根据歌曲的标签、歌词的情感、节奏来合理推测,而非机械地按照歌词长度分配。第一句歌词的时间戳应考虑前奏长度,避免歌词从 `[00:00.00]` 直接开始。严格按照 LRC 格式输出歌词,每行格式为 `[mm:ss.xx]歌词内容`。最后的结果只输出LRC,不需要其他的解释。
128
- """
129
-
130
- response = client.chat.completions.create(
131
- model="ep-20250304144033-nr9wl",
132
- messages=[
133
- {"role": "system", "content": "You are a professional musician who has been invited to make music-related comments."},
134
- {"role": "user", "content": llm_prompt.format(lyrics_input=lyrics_input, tags_lyrics=tags_lyrics)},
135
- ],
136
- stream=False
137
- )
138
-
139
- info = response.choices[0].message.content
140
-
141
- return info
142
-
143
- css = """
144
- /* 固定文本域高度并强制滚动条 */
145
- .lyrics-scroll-box textarea {
146
- height: 405px !important; /* 固定高度 */
147
- max-height: 500px !important; /* 最大高度 */
148
- overflow-y: auto !important; /* 垂直滚动 */
149
- white-space: pre-wrap; /* 保留换行 */
150
- line-height: 1.5; /* 行高优化 */
151
- }
152
-
153
- .gr-examples {
154
- background: transparent !important;
155
- border: 1px solid #e0e0e0 !important;
156
- border-radius: 8px;
157
- margin: 1rem 0 !important;
158
- padding: 1rem !important;
159
- }
160
-
161
- """
162
-
163
 
164
- with gr.Blocks(css=css) as demo:
165
- gr.HTML(f"""
166
- <div style="display: flex; align-items: center;">
167
- <img src='https://raw.githubusercontent.com/ASLP-lab/DiffRhythm/refs/heads/main/src/DiffRhythm_logo.jpg'
168
- style='width: 200px; height: 40%; display: block; margin: 0 auto 20px;'>
169
- </div>
170
-
171
- <div style="flex: 1; text-align: center;">
172
- <div style="font-size: 2em; font-weight: bold; text-align: center; margin-bottom: 5px">
173
- Di♪♪Rhythm (谛韵)
174
- </div>
175
- <div style="display:flex; justify-content: center; column-gap:4px;">
176
- <a href="https://arxiv.org/abs/2503.01183">
177
- <img src='https://img.shields.io/badge/Arxiv-Paper-blue'>
178
- </a>
179
- <a href="https://github.com/ASLP-lab/DiffRhythm">
180
- <img src='https://img.shields.io/badge/GitHub-Repo-green'>
181
- </a>
182
- <a href="https://aslp-lab.github.io/DiffRhythm.github.io/">
183
- <img src='https://img.shields.io/badge/Project-Page-brown'>
184
- </a>
185
- </div>
186
- </div>
187
- """)
188
 
189
- with gr.Tabs() as tabs:
190
-
191
- # page 1
192
- with gr.Tab("Music Generate", id=0):
193
- with gr.Row():
194
- with gr.Column():
195
- lrc = gr.Textbox(
196
- label="Lyrics",
197
- placeholder="Input the full lyrics",
198
- lines=12,
199
- max_lines=50,
200
- elem_classes="lyrics-scroll-box",
201
- value="""[00:04.074] Tell me that I'm special\n[00:06.226] Tell me I look pretty\n[00:08.175] Tell me I'm a little angel\n[00:10.175] Sweetheart of your city\n[00:13.307] Say what I'm dying to hear\n[00:17.058] 'Cause I'm dying to hear you\n[00:20.523] Tell me I'm that new thing\n[00:22.571] Tell me that I'm relevant\n[00:24.723] Tell me that I got a big heart\n[00:26.723] Then back it up with evidence\n[00:29.408] I need it and I don't know why\n[00:33.907] This late at night\n[00:36.139] Isn't it lonely\n[00:38.991] I'd do anything to make you want me\n[00:43.222] I'd give it all up if you told me\n[00:47.339] That I'd be\n[00:49.157] The number one girl in your eyes\n[00:52.506] Your one and only\n[00:55.437] So what's it gon' take for you to want me\n[00:59.589] I'd give it all up if you told me\n[01:03.674] That I'd be\n[01:05.823] The number one girl in your eyes\n[01:10.841] Tell me I'm going real big places\n[01:14.055] Down to earth, so friendly\n[01:16.105] And even through all the phases\n[01:18.256] Tell me you accept me\n[01:21.155] Well, that's all I'm dying to hear\n[01:24.937] Yeah, I'm dying to hear you\n[01:28.521] Tell me that you need me\n[01:30.437] Tell me that I'm loved\n[01:32.740] Tell me that I'm worth it\n[01:34.605] And that I'm enough\n[01:37.571] I need it and I don't know why\n[01:41.889] This late at night\n[01:43.805] Isn't it lonely\n[01:46.871] I'd do anything to make you want me\n[01:51.004] I'd give it all up if you told me\n[01:55.237] That I'd be\n[01:57.089] The number one girl in your eyes\n[02:00.325] Your one and only\n[02:03.305] So what's it gon' take for you to want me\n[02:07.355] I'd give it all up if you told me\n[02:11.589] That I'd be\n[02:13.623] The number one girl in your eyes\n[02:16.804] The girl in your eyes\n[02:20.823] The girl in your eyes\n[02:26.055] Tell me I'm the number one girl\n[02:28.355] I'm the number one girl in your eyes\n[02:33.172] The girl in your eyes\n[02:37.321] The girl in your eyes\n[02:42.472] Tell me I'm the number one girl\n[02:44.539] I'm the number one girl in your eyes\n[02:49.605] Well isn't it lonely\n[02:52.488] I'd do anything to make you want me\n[02:56.637] I'd give it all up if you told me\n[03:00.888] That I'd be\n[03:03.172] The number one girl in your eyes\n[03:06.272] Your one and only\n[03:09.160] So what's it gon' take for you to want me\n[03:13.056] I'd give it all up if you told me\n[03:17.305] That I'd be\n[03:19.488] The number one girl in your eyes\n[03:25.420] The number one girl in your eyes\n"""
202
- )
203
-
204
- current_prompt_type = gr.State(value="audio")
205
- with gr.Tabs() as inside_tabs:
206
- with gr.Tab("Audio Prompt"):
207
- audio_prompt = gr.Audio(label="Audio Prompt", type="filepath", value="./src/prompt/default.wav")
208
- with gr.Tab("Text Prompt"):
209
- text_prompt = gr.Textbox(
210
- label="Text Prompt",
211
- placeholder="Enter the Text Prompt, eg: emotional piano pop",
212
- )
213
- def update_prompt_type(evt: gr.SelectData):
214
- return "audio" if evt.index == 0 else "text"
215
-
216
- inside_tabs.select(
217
- fn=update_prompt_type,
218
- outputs=current_prompt_type
219
- )
220
-
221
- with gr.Column():
222
- with gr.Accordion("Best Practices Guide", open=True):
223
- gr.Markdown("""
224
- 1. **Lyrics Format Requirements**
225
- - Each line must follow: `[mm:ss.xx]Lyric content`
226
- - Example of valid format:
227
- ```
228
- [00:10.00]Moonlight spills through broken blinds
229
- [00:13.20]Your shadow dances on the dashboard shrine
230
- ```
231
-
232
- 2. **Generation Duration Limits**
233
- - The generated music must be between **95 seconds (1:35)** and **285 seconds (4:45)** in length
234
- - The latest valid lyric timestamp cannot exceed **04:45.00 (285s)**
235
-
236
- 3. **Audio Prompt Requirements**
237
- - Reference audio should be ≥ 1 second, Audio >10 seconds will be randomly clipped into 10 seconds
238
- - For optimal results, the 10-second clips should be carefully selected
239
- - Shorter clips may lead to incoherent generation
240
-
241
- 4. **Supported Languages**
242
- - Chinese and English
243
- - More languages comming soon
244
-
245
- 5. **Others**
246
- - If loading audio result is slow, you can select Output Format as mp3 in Advanced Settings.
247
- """)
248
- # Music_Duration = gr.Radio(["95s", "285s"], label="Music Duration", value="95s")
249
- Music_Duration = gr.Slider(
250
- minimum=95,
251
- maximum=285,
252
- step=1,
253
- value=95,
254
- label="Music Duration (s)",
255
- interactive=True
256
- )
257
- preference_infer = gr.Radio(["quality first", "speed first"], label="Preference", value="quality first")
258
- lyrics_btn = gr.Button("Generate", variant="primary")
259
- audio_output = gr.Audio(label="Audio Result", type="filepath", elem_id="audio_output")
260
- with gr.Accordion("Advanced Settings", open=False):
261
- seed = gr.Slider(
262
- label="Seed",
263
- minimum=0,
264
- maximum=MAX_SEED,
265
- step=1,
266
- value=0,
267
- )
268
- randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
269
-
270
- steps = gr.Slider(
271
- minimum=10,
272
- maximum=100,
273
- value=32,
274
- step=1,
275
- label="Diffusion Steps",
276
- interactive=True,
277
- elem_id="step_slider"
278
- )
279
- cfg_strength = gr.Slider(
280
- minimum=1,
281
- maximum=10,
282
- value=4.0,
283
- step=0.5,
284
- label="CFG Strength",
285
- interactive=True,
286
- elem_id="step_slider"
287
- )
288
- # edit = gr.Checkbox(label="edit", value=False)
289
- # edit = False
290
- # preference_infer = gr.Radio(["quality first", "speed first"], label="Preference", value="quality first")
291
- # edit_segments = gr.Textbox(
292
- # label="Edit Segments",
293
- # placeholder="Time segments to edit (in seconds). Format: `[[start1,end1],...]",
294
- # )
295
-
296
- odeint_method = gr.Radio(["euler", "midpoint", "rk4","implicit_adams"], label="ODE Solver", value="euler")
297
- file_type = gr.Dropdown(["wav", "mp3", "ogg"], label="Output Format", value="mp3")
298
-
299
-
300
- gr.Examples(
301
- examples=[
302
- ["./src/prompt/pop_cn.wav"],
303
- ["./src/prompt/pop_en.wav"],
304
- ["./src/prompt/rock_cn.wav"],
305
- ["./src/prompt/rock_en.wav"],
306
- ["./src/prompt/country_cn.wav"],
307
- ["./src/prompt/country_en.wav"],
308
- ["./src/prompt/classic_cn.wav"],
309
- ["./src/prompt/classic_en.wav"],
310
- ["./src/prompt/jazz_cn.wav"],
311
- ["./src/prompt/jazz_en.wav"],
312
- ["./src/prompt/rap_cn.wav"],
313
- ["./src/prompt/rap_en.wav"],
314
- ["./src/prompt/default.wav"]
315
- ],
316
- inputs=[audio_prompt],
317
- label="Audio Examples",
318
- examples_per_page=13,
319
- elem_id="audio-examples-container"
320
- )
321
-
322
- gr.Examples(
323
- examples=[
324
- ["Pop Emotional Piano"],
325
- ["流行 情感 钢琴"],
326
- ["Indie folk ballad, coming-of-age themes, acoustic guitar picking with harmonica interludes"],
327
- ["独立民谣, 成长主题, 原声吉他弹奏与口琴间奏"]
328
- ],
329
- inputs=[text_prompt],
330
- label="Text Examples",
331
- examples_per_page=4,
332
- elem_id="text-examples-container"
333
- )
334
 
335
- gr.Examples(
336
- examples=[
337
- ["""[00:04.074] Tell me that I'm special\n[00:06.226] Tell me I look pretty\n[00:08.175] Tell me I'm a little angel\n[00:10.175] Sweetheart of your city\n[00:13.307] Say what I'm dying to hear\n[00:17.058] 'Cause I'm dying to hear you\n[00:20.523] Tell me I'm that new thing\n[00:22.571] Tell me that I'm relevant\n[00:24.723] Tell me that I got a big heart\n[00:26.723] Then back it up with evidence\n[00:29.408] I need it and I don't know why\n[00:33.907] This late at night\n[00:36.139] Isn't it lonely\n[00:38.991] I'd do anything to make you want me\n[00:43.222] I'd give it all up if you told me\n[00:47.339] That I'd be\n[00:49.157] The number one girl in your eyes\n[00:52.506] Your one and only\n[00:55.437] So what's it gon' take for you to want me\n[00:59.589] I'd give it all up if you told me\n[01:03.674] That I'd be\n[01:05.823] The number one girl in your eyes\n[01:10.841] Tell me I'm going real big places\n[01:14.055] Down to earth, so friendly\n[01:16.105] And even through all the phases\n[01:18.256] Tell me you accept me\n[01:21.155] Well, that's all I'm dying to hear\n[01:24.937] Yeah, I'm dying to hear you\n[01:28.521] Tell me that you need me\n[01:30.437] Tell me that I'm loved\n[01:32.740] Tell me that I'm worth it\n[01:34.605] And that I'm enough\n[01:37.571] I need it and I don't know why\n[01:41.889] This late at night\n[01:43.805] Isn't it lonely\n[01:46.871] I'd do anything to make you want me\n[01:51.004] I'd give it all up if you told me\n[01:55.237] That I'd be\n[01:57.089] The number one girl in your eyes\n[02:00.325] Your one and only\n[02:03.305] So what's it gon' take for you to want me\n[02:07.355] I'd give it all up if you told me\n[02:11.589] That I'd be\n[02:13.623] The number one girl in your eyes\n[02:16.804] The girl in your eyes\n[02:20.823] The girl in your eyes\n[02:26.055] Tell me I'm the number one girl\n[02:28.355] I'm the number one girl in your eyes\n[02:33.172] The girl in your eyes\n[02:37.321] The girl in your eyes\n[02:42.472] Tell me I'm the number one girl\n[02:44.539] I'm the number one girl in your eyes\n[02:49.605] Well isn't it lonely\n[02:52.488] I'd do anything to make you want me\n[02:56.637] I'd give it all up if you told me\n[03:00.888] That I'd be\n[03:03.172] The number one girl in your eyes\n[03:06.272] Your one and only\n[03:09.160] So what's it gon' take for you to want me\n[03:13.056] I'd give it all up if you told me\n[03:17.305] That I'd be\n[03:19.488] The number one girl in your eyes\n[03:25.420] The number one girl in your eyes\n"""],
338
- ["""[00:00.133]Abracadabra, abracadabra\n[00:03.985]Abracadabra, abracadabra\n[00:15.358]Pay the toll to the angels\n[00:18.694]Drawin' circles in the clouds\n[00:22.966]Keep your mind on the distance\n[00:26.321]When the devil turns around\n[00:30.540]Hold me in your heart tonight\n[00:33.751]In the magic of the dark moonlight\n[00:38.189]Save me from this empty fight\n[00:43.521]In the game of life\n[00:45.409]Like a poem said by a lady in red\n[00:49.088]You hear the last few words of your life\n[00:53.013]With a haunting dance, now you're both in a trance\n[00:56.687]It's time to cast your spell on the night\n[01:01.131]Abracadabra amor-oo-na-na\n[01:04.394]Abracadabra morta-oo-gaga\n[01:08.778]Abracadabra, abra-ooh-na-na\n[01:12.063]In her tongue, she's sayin'\n[01:14.367]Death or love tonight\n[01:18.249]Abracadabra, abracadabra\n[01:22.136]Abracadabra, abracadabra\n[01:25.859]Feel the beat under your feet\n[01:27.554]The floor's on fire\n[01:29.714]Abracadabra, abracadabra\n[01:33.464]Choose the road on the west side\n[01:36.818]As the dust flies, watch it burn\n[01:41.057]Don't waste time on feeling\n[01:44.419]Use your passion no return\n[01:48.724]Hold me in your heart tonight\n[01:51.886]In the magic of the dark moonlight\n[01:56.270]Save me from this empty fight\n[02:01.599]In the game of life\n[02:03.524]Like a poem said by a lady in red\n[02:07.192]You hear the last few words of your life\n[02:11.055]With a haunting dance, now you're both in a trance\n[02:14.786]It's time to cast your spell on the night\n[02:19.225]Abracadabra amor-oo-na-na\n[02:22.553]Abracadabra morta-oo-gaga\n[02:26.852]Abracadabra, abra-ooh-na-na\n[02:30.110]In her tongue, she's sayin'\n[02:32.494]Death or love tonight\n[02:36.244]Abracadabra, abracadabra\n[02:40.161]Abracadabra, abracadabra\n[02:43.966]Feel the beat under your feet\n[02:45.630]The floor's on fire\n[02:47.812]Abracadabra, abracadabra\n[02:50.537]Phantom of the dancefloor, come to me\n[02:58.169]Sing for me a sinful melody\n[03:05.833]Ah-ah-ah-ah-ah, ah-ah, ah-ah\n[03:13.453]Ah-ah-ah-ah-ah, ah-ah, ah-ah\n[03:22.025]Abracadabra amor-oo-na-na\n[03:25.423]Abracadabra morta-oo-gaga\n[03:29.674]Abracadabra, abra-ooh-na-na\n[03:33.013]In her tongue, she's sayin'\n[03:35.401]Death or love tonight\n"""],
339
- ["""[00:00.27]只��你太美 baby 只因你太美 baby\n[00:08.95]只因你实在是太美 baby\n[00:13.99]只因你太美 baby\n[00:18.89]迎面走来的你让我如此蠢蠢欲动\n[00:20.88]这种感觉我从未有\n[00:21.79]Cause I got a crush on you who you\n[00:25.74]你是我的我是你的谁\n[00:28.09]再多一眼看一眼就会爆炸\n[00:30.31]再近一点靠近点快被融化\n[00:32.49]想要把你占为己有 baby bae\n[00:34.60]不管走到哪里\n[00:35.44]都会想起的人是你 you you\n[00:38.12]我应该拿你怎样\n[00:39.61]Uh 所有人都在看着你\n[00:42.36]我的心总是不安\n[00:44.18]Oh 我现在已病入膏肓\n[00:46.63]Eh oh\n[00:47.84]难道真的因你而疯狂吗\n[00:51.57]我本来不是这种人\n[00:53.59]因你变成奇怪的人\n[00:55.77]第一次呀变成这样的我\n[01:01.23]不管我怎么去否认\n[01:03.21]只因你太美 baby 只因你太美 baby\n[01:11.46]只因你实在是太美 baby\n[01:16.75]只因你太美 baby\n[01:21.09]Oh eh oh\n[01:22.82]现在确认地告诉我\n[01:25.26]Oh eh oh\n[01:27.31]你到底属于谁\n[01:29.98]Oh eh oh\n[01:31.70]现在确认地告诉我\n[01:34.45]Oh eh oh\n"""],
340
- ["""[00:19.50]也想不到要怎么问你别来无恙\n[00:25.71]世界乱的一塌糊涂可是能怎样\n[00:31.85]偶尔抬起头来还好有颗月亮可赏\n[00:38.96]太多回忆要我怎么摆进行李箱\n[00:45.22]一直没哭一直走路走灰多少太阳\n[00:51.70]因为往事没有办法悬赏 隐形在那大街小巷\n[01:00.22]剪断了它还嚣张\n[01:03.85]我的嘴在说谎 说的那么漂亮\n[01:10.07]说我早就忘了你像月一样的俏脸庞\n[01:16.51]最怕一边忙呀忙一边回想那旧时光\n[01:22.87]剪不掉的是你 带泪的脸 还真是烦\n[01:43.32]多少原因将我绑在半夜屋顶上\n[01:49.23]一直没再爱一个人如今就是这样\n[01:55.75]因为故事跟你说了一半 于是搁在所谓云端\n[02:04.21]谁忘不了谁孤单\n[02:07.79]我的心在说谎 说下去会疯狂\n[02:14.02]如果没有月亮那些日子都无妨\n[02:20.43]最怕一边忙呀忙一边想那旧时光\n[02:26.91]剪不掉的是你 带笑的苦 还真烦\n[02:33.81]我的嘴又说了谎 说的那么漂亮\n[02:39.68]以为已经忘了你的那些美像月光它剪不断\n[02:47.15]因为爱早就钻进心脏 心一跳泪就会烫\n[02:52.22]那些带泪的脸 带笑的苦 还真烦\n[02:59.28]月亮是个凶手 想你的我 是通缉犯\n[03:08.03]我有时候真的很怕望见那月光中的你\n"""]
341
- ],
342
-
343
- inputs=[lrc],
344
- label="Lrc Examples",
345
- examples_per_page=4,
346
- elem_id="lrc-examples-container",
347
- )
348
 
 
349
 
350
- # page 2
351
- with gr.Tab("Lyrics Generate", id=1):
352
- with gr.Row():
353
- with gr.Column():
354
- with gr.Accordion("Notice", open=False):
355
- gr.Markdown("**Two Generation Modes:**\n1. Generate from theme & tags\n2. Add timestamps to existing lyrics")
356
-
357
- with gr.Group():
358
- gr.Markdown("### Method 1: Generate from Theme")
359
- theme = gr.Textbox(label="theme", placeholder="Enter song theme, e.g: Love and Heartbreak")
360
- tags_gen = gr.Textbox(label="tags", placeholder="Enter song tags, e.g: pop confidence healing")
361
- language = gr.Radio(["cn", "en"], label="Language", value="en")
362
- gen_from_theme_btn = gr.Button("Generate LRC (From Theme)", variant="primary")
363
-
364
- gr.Examples(
365
- examples=[
366
- [
367
- "Love and Heartbreak",
368
- "vocal emotional piano pop",
369
- "en"
370
- ],
371
- [
372
- "Heroic Epic",
373
- "choir orchestral powerful",
374
- "cn"
375
- ]
376
- ],
377
- inputs=[theme, tags_gen, language],
378
- label="Examples: Generate from Theme"
379
- )
380
-
381
- with gr.Group(visible=True):
382
- gr.Markdown("### Method 2: Add Timestamps to Lyrics")
383
- tags_lyrics = gr.Textbox(label="tags", placeholder="Enter song tags, e.g: ballad piano slow")
384
- lyrics_input = gr.Textbox(
385
- label="Raw Lyrics (without timestamps)",
386
- placeholder="Enter plain lyrics (without timestamps), e.g:\nYesterday\nAll my troubles...",
387
- lines=10,
388
- max_lines=50,
389
- elem_classes="lyrics-scroll-box"
390
- )
391
-
392
- gen_from_lyrics_btn = gr.Button("Generate LRC (From Lyrics)", variant="primary")
393
-
394
- gr.Examples(
395
- examples=[
396
- [
397
- "acoustic folk happy",
398
- """I'm sitting here in the boring room\nIt's just another rainy Sunday afternoon"""
399
- ],
400
- [
401
- "electronic dance energetic",
402
- """We're living in a material world\nAnd I am a material girl"""
403
- ]
404
- ],
405
- inputs=[tags_lyrics, lyrics_input],
406
- label="Examples: Generate from Lyrics"
407
- )
408
-
409
-
410
- with gr.Column():
411
- lrc_output = gr.Textbox(
412
- label="Generated LRC",
413
- placeholder="Timed lyrics will appear here",
414
- lines=57,
415
- elem_classes="lrc-output",
416
- show_copy_button=True
417
- )
418
-
419
- # Bind functions
420
- gen_from_theme_btn.click(
421
- fn=R1_infer1,
422
- inputs=[theme, tags_gen, language],
423
- outputs=lrc_output
424
- )
425
-
426
- gen_from_lyrics_btn.click(
427
- fn=R1_infer2,
428
- inputs=[tags_lyrics, lyrics_input],
429
- outputs=lrc_output
430
- )
431
-
432
- tabs.select(
433
- lambda s: None,
434
- None,
435
- None
436
- )
437
-
438
- lyrics_btn.click(
439
- fn=infer_music,
440
- inputs=[lrc, audio_prompt, text_prompt, current_prompt_type, seed, randomize_seed, steps, cfg_strength, file_type, odeint_method, preference_infer, Music_Duration],
441
- outputs=audio_output
442
  )
443
 
444
-
445
- if __name__ == "__main__":
446
- demo.launch()
 
 
 
 
 
 
1
  import torch
2
+ import gradio as gr
 
 
 
 
 
 
3
  import random
4
+ import traceback
5
+
6
+ # -------------------------------------------------
7
+ # FORCE CPU (FREE TIER SAFE)
8
+ # -------------------------------------------------
9
+ device = "cpu"
10
+ print("Running in CPU mode (Free tier safe)")
11
+
12
+ # -------------------------------------------------
13
+ # IMPORT YOUR ORIGINAL UTILITIES
14
+ # -------------------------------------------------
15
+ from diffrhythm.infer.infer_utils import prepare_model, infer_music
16
+
17
+ # -------------------------------------------------
18
+ # LOAD MODEL (REDUCED MEMORY MODE)
19
+ # -------------------------------------------------
20
+ try:
21
+ cfm, tokenizer, muq, vae, eval_model, eval_muq = prepare_model(
22
+ max_frames=2048, # Reduced from 6144
23
+ device=device
24
+ )
25
+ print("Model loaded successfully.")
26
+ except Exception as e:
27
+ print("Model loading failed:")
28
+ print(traceback.format_exc())
29
+ raise e
30
+
31
+ # -------------------------------------------------
32
+ # SAFE GENERATION FUNCTION
33
+ # -------------------------------------------------
34
+ def generate_music(
35
+ prompt,
36
+ duration,
37
+ guidance_scale,
38
+ seed
39
+ ):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  try:
41
+ if seed == -1:
42
+ seed = random.randint(0, 999999)
43
+
44
+ torch.manual_seed(int(seed))
45
+
46
+ audio = infer_music(
47
+ cfm=cfm,
48
+ tokenizer=tokenizer,
49
+ muq=muq,
50
+ vae=vae,
51
+ eval_model=eval_model,
52
+ eval_muq=eval_muq,
53
+ prompt=prompt,
54
+ duration=int(duration),
55
+ guidance_scale=float(guidance_scale),
56
+ device=device
 
 
 
 
 
 
 
 
 
 
 
 
57
  )
 
 
 
 
58
 
59
+ return audio
 
 
60
 
61
+ except Exception as e:
62
+ return f"Error during generation:\n{traceback.format_exc()}"
63
 
64
+ # -------------------------------------------------
65
+ # GRADIO UI
66
+ # -------------------------------------------------
67
+ with gr.Blocks() as demo:
68
 
69
+ gr.Markdown("# 🎵 DiffRhythm (CPU Safe Version)")
70
+ gr.Markdown("Running on Free CPU mode. Generation will be slow.")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
71
 
72
+ with gr.Row():
73
+ prompt = gr.Textbox(label="Music Prompt", placeholder="Describe the music...")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
 
75
+ with gr.Row():
76
+ duration = gr.Slider(5, 30, value=10, step=1, label="Duration (seconds)")
77
+ guidance = gr.Slider(1, 10, value=5, step=0.5, label="Guidance Scale")
78
+ seed = gr.Number(value=-1, label="Seed (-1 = random)")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
 
80
+ generate_btn = gr.Button("Generate Music")
 
 
 
 
 
 
 
 
 
 
 
 
81
 
82
+ output_audio = gr.Audio(label="Generated Audio")
83
 
84
+ generate_btn.click(
85
+ fn=generate_music,
86
+ inputs=[prompt, duration, guidance, seed],
87
+ outputs=output_audio
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
88
  )
89
 
90
+ demo.launch()