Spaces:
Running on Zero
Update app.py
Browse files
app.py
CHANGED
|
@@ -85,8 +85,18 @@ def infer_img2img(prompt, audio_path, desired_strength, progress=gr.Progress(tra
|
|
| 85 |
audio, sampling_rate = load_wav(audio_path)
|
| 86 |
audio, spec = get_mel_spectrogram_from_audio(audio)
|
| 87 |
|
| 88 |
-
#
|
| 89 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 90 |
|
| 91 |
# norm_spec = norm_spec[:,:, width_start:width_start+width]
|
| 92 |
norm_spec = pad_spec(norm_spec, 1024)
|
|
|
|
| 85 |
audio, sampling_rate = load_wav(audio_path)
|
| 86 |
audio, spec = get_mel_spectrogram_from_audio(audio)
|
| 87 |
|
| 88 |
+
# Check if the spectrogram mean before normalization is too low
|
| 89 |
+
spec_mean_before = spec.mean().item()
|
| 90 |
+
|
| 91 |
+
# Apply fix only if the spectrogram mean is too low
|
| 92 |
+
if spec_mean_before < -5.0:
|
| 93 |
+
print(f"⚠️ Spectrogram too low (Mean: {spec_mean_before}). Applying boost!")
|
| 94 |
+
spec = spec * 1.5 # Adjust multiplier if needed
|
| 95 |
+
else:
|
| 96 |
+
print(f"✅ Spectrogram looks normal (Mean: {spec_mean_before}). No boost needed.")
|
| 97 |
+
|
| 98 |
+
# Normalize the spectrogram
|
| 99 |
+
norm_spec = normalize_spectrogram(spec)
|
| 100 |
|
| 101 |
# norm_spec = norm_spec[:,:, width_start:width_start+width]
|
| 102 |
norm_spec = pad_spec(norm_spec, 1024)
|