fffiloni committed on
Commit
dde3732
·
verified ·
1 Parent(s): 51755b8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -2
app.py CHANGED
@@ -85,8 +85,18 @@ def infer_img2img(prompt, audio_path, desired_strength, progress=gr.Progress(tra
85
  audio, sampling_rate = load_wav(audio_path)
86
  audio, spec = get_mel_spectrogram_from_audio(audio)
87
 
88
- #norm_spec = normalize_spectrogram(spec)
89
- norm_spec = debug_spectrogram(audio, spec, "Your File")
 
 
 
 
 
 
 
 
 
 
90
 
91
  # norm_spec = norm_spec[:,:, width_start:width_start+width]
92
  norm_spec = pad_spec(norm_spec, 1024)
 
85
  audio, sampling_rate = load_wav(audio_path)
86
  audio, spec = get_mel_spectrogram_from_audio(audio)
87
 
88
+ # Check if the spectrogram mean before normalization is too low
89
+ spec_mean_before = spec.mean().item()
90
+
91
+ # Apply fix only if the spectrogram mean is too low
92
+ if spec_mean_before < -5.0:
93
+ print(f"⚠️ Spectrogram too low (Mean: {spec_mean_before}). Applying boost!")
94
+ spec = spec * 1.5 # Adjust multiplier if needed
95
+ else:
96
+ print(f"✅ Spectrogram looks normal (Mean: {spec_mean_before}). No boost needed.")
97
+
98
+ # Normalize the spectrogram
99
+ norm_spec = normalize_spectrogram(spec)
100
 
101
  # norm_spec = norm_spec[:,:, width_start:width_start+width]
102
  norm_spec = pad_spec(norm_spec, 1024)