Update app.py
Browse files
app.py
CHANGED
@@ -85,8 +85,18 @@ def infer_img2img(prompt, audio_path, desired_strength, progress=gr.Progress(tra
|
|
85 |
audio, sampling_rate = load_wav(audio_path)
|
86 |
audio, spec = get_mel_spectrogram_from_audio(audio)
|
87 |
|
88 |
-
#
|
89 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
90 |
|
91 |
# norm_spec = norm_spec[:,:, width_start:width_start+width]
|
92 |
norm_spec = pad_spec(norm_spec, 1024)
|
|
|
85 |
audio, sampling_rate = load_wav(audio_path)
|
86 |
audio, spec = get_mel_spectrogram_from_audio(audio)
|
87 |
|
88 |
+
# Check if the spectrogram mean before normalization is too low
|
89 |
+
spec_mean_before = spec.mean().item()
|
90 |
+
|
91 |
+
# Scale the spectrogram only when its pre-normalization mean is below -5.0
|
92 |
+
if spec_mean_before < -5.0:
|
93 |
+
print(f"⚠️ Spectrogram too low (Mean: {spec_mean_before}). Applying boost!")
|
94 |
+
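spec = spec * 1.5 # NOTE(review): the mean is negative in this branch, so scaling by 1.5 makes it more negative -- confirm this is the intended "boost"; tune the multiplier if needed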
|
95 |
+
else:
|
96 |
+
print(f"✅ Spectrogram looks normal (Mean: {spec_mean_before}). No boost needed.")
|
97 |
+
|
98 |
+
# Normalize the spectrogram
|
99 |
+
norm_spec = normalize_spectrogram(spec)
|
100 |
|
101 |
# norm_spec = norm_spec[:,:, width_start:width_start+width]
|
102 |
norm_spec = pad_spec(norm_spec, 1024)
|