fffiloni committed on
Commit
b8ba919
·
verified ·
1 Parent(s): 9710eda

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -2
app.py CHANGED
@@ -215,8 +215,14 @@ def infer_inp(prompt, audio_path, mask_start_point, mask_end_point, progress=gr.
215
  # Ensure correct shape
216
  denorm_spec_audio = denorm_spec_audio.flatten() # Converts (1, N) → (N,)
217
 
218
- # Normalize the audio to prevent clipping or excessive loudness
219
- denorm_spec_audio = denorm_spec_audio / np.max(np.abs(denorm_spec_audio)) # Scale between -1 and 1
 
 
 
 
 
 
220
 
221
  # Save as WAV
222
  sf.write("output.wav", denorm_spec_audio, 16000)
@@ -394,6 +400,12 @@ with gr.Blocks(css=css) as demo:
394
  outputs = [audio_in_spec]
395
  )
396
 
 
 
 
 
 
 
397
  preview_mask_btn.click(
398
  fn = preview_masked_area,
399
  inputs = [audio_in_inp, mask_start_point, mask_end_point],
 
215
  # Ensure correct shape
216
  denorm_spec_audio = denorm_spec_audio.flatten() # Converts (1, N) → (N,)
217
 
218
+ print("Original spectrogram min/max:", norm_spec.min().item(), norm_spec.max().item())
219
+ print("Generated spectrogram min/max:", output_spec.min().item(), output_spec.max().item())
220
+
221
+ global_max = max(np.max(np.abs(raw_chunk_audio)), np.max(np.abs(denorm_spec_audio)))
222
+ denorm_spec_audio = denorm_spec_audio / global_max # Normalize using a shared scale
223
+
224
+ print("Masked spectrogram min/max:", masked_spec.min().item(), masked_spec.max().item())
225
+ print("Output spectrogram min/max:", output_spec.min().item(), output_spec.max().item())
226
 
227
  # Save as WAV
228
  sf.write("output.wav", denorm_spec_audio, 16000)
 
400
  outputs = [audio_in_spec]
401
  )
402
 
403
+ audio_in_inp.stop_recording(
404
+ fn = load_input_spectrogram,
405
+ inputs = [audio_in_inp],
406
+ outputs = [audio_in_spec]
407
+ )
408
+
409
  preview_mask_btn.click(
410
  fn = preview_masked_area,
411
  inputs = [audio_in_inp, mask_start_point, mask_end_point],