Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -215,8 +215,14 @@ def infer_inp(prompt, audio_path, mask_start_point, mask_end_point, progress=gr.
|
|
| 215 |
# Ensure correct shape
|
| 216 |
denorm_spec_audio = denorm_spec_audio.flatten() # Converts (1, N) → (N,)
|
| 217 |
|
| 218 |
-
|
| 219 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 220 |
|
| 221 |
# Save as WAV
|
| 222 |
sf.write("output.wav", denorm_spec_audio, 16000)
|
|
@@ -394,6 +400,12 @@ with gr.Blocks(css=css) as demo:
|
|
| 394 |
outputs = [audio_in_spec]
|
| 395 |
)
|
| 396 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 397 |
preview_mask_btn.click(
|
| 398 |
fn = preview_masked_area,
|
| 399 |
inputs = [audio_in_inp, mask_start_point, mask_end_point],
|
|
|
|
| 215 |
# Ensure correct shape
|
| 216 |
denorm_spec_audio = denorm_spec_audio.flatten() # Converts (1, N) → (N,)
|
| 217 |
|
| 218 |
+
print("Original spectrogram min/max:", norm_spec.min().item(), norm_spec.max().item())
|
| 219 |
+
print("Generated spectrogram min/max:", output_spec.min().item(), output_spec.max().item())
|
| 220 |
+
|
| 221 |
+
global_max = max(np.max(np.abs(raw_chunk_audio)), np.max(np.abs(denorm_spec_audio)))
|
| 222 |
+
denorm_spec_audio = denorm_spec_audio / global_max # Normalize using a shared scale
|
| 223 |
+
|
| 224 |
+
print("Masked spectrogram min/max:", masked_spec.min().item(), masked_spec.max().item())
|
| 225 |
+
print("Output spectrogram min/max:", output_spec.min().item(), output_spec.max().item())
|
| 226 |
|
| 227 |
# Save as WAV
|
| 228 |
sf.write("output.wav", denorm_spec_audio, 16000)
|
|
|
|
| 400 |
outputs = [audio_in_spec]
|
| 401 |
)
|
| 402 |
|
| 403 |
+
audio_in_inp.stop_recording(
|
| 404 |
+
fn = load_input_spectrogram,
|
| 405 |
+
inputs = [audio_in_inp],
|
| 406 |
+
outputs = [audio_in_spec]
|
| 407 |
+
)
|
| 408 |
+
|
| 409 |
preview_mask_btn.click(
|
| 410 |
fn = preview_masked_area,
|
| 411 |
inputs = [audio_in_inp, mask_start_point, mask_end_point],
|