Update app.py
Browse files
app.py
CHANGED
@@ -215,8 +215,14 @@ def infer_inp(prompt, audio_path, mask_start_point, mask_end_point, progress=gr.
|
|
215 |
# Ensure correct shape
|
216 |
denorm_spec_audio = denorm_spec_audio.flatten() # Converts (1, N) → (N,)
|
217 |
|
218 |
-
|
219 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
220 |
|
221 |
# Save as WAV
|
222 |
sf.write("output.wav", denorm_spec_audio, 16000)
|
@@ -394,6 +400,12 @@ with gr.Blocks(css=css) as demo:
|
|
394 |
outputs = [audio_in_spec]
|
395 |
)
|
396 |
|
|
|
|
|
|
|
|
|
|
|
|
|
397 |
preview_mask_btn.click(
|
398 |
fn = preview_masked_area,
|
399 |
inputs = [audio_in_inp, mask_start_point, mask_end_point],
|
|
|
215 |
# Ensure correct shape
|
216 |
denorm_spec_audio = denorm_spec_audio.flatten() # Converts (1, N) → (N,)
|
217 |
|
218 |
+
print("Original spectrogram min/max:", norm_spec.min().item(), norm_spec.max().item())
|
219 |
+
print("Generated spectrogram min/max:", output_spec.min().item(), output_spec.max().item())
|
220 |
+
|
221 |
+
global_max = max(np.max(np.abs(raw_chunk_audio)), np.max(np.abs(denorm_spec_audio)))
|
222 |
+
denorm_spec_audio = denorm_spec_audio / global_max # Normalize using a shared scale
|
223 |
+
|
224 |
+
print("Masked spectrogram min/max:", masked_spec.min().item(), masked_spec.max().item())
|
225 |
+
print("Output spectrogram min/max:", output_spec.min().item(), output_spec.max().item())
|
226 |
|
227 |
# Save as WAV
|
228 |
sf.write("output.wav", denorm_spec_audio, 16000)
|
|
|
400 |
outputs = [audio_in_spec]
|
401 |
)
|
402 |
|
403 |
+
audio_in_inp.stop_recording(
|
404 |
+
fn = load_input_spectrogram,
|
405 |
+
inputs = [audio_in_inp],
|
406 |
+
outputs = [audio_in_spec]
|
407 |
+
)
|
408 |
+
|
409 |
preview_mask_btn.click(
|
410 |
fn = preview_masked_area,
|
411 |
inputs = [audio_in_inp, mask_start_point, mask_end_point],
|