Spaces:

YoniAfek
/

hebrew-chat

Runtime error

App Files Community

Yoni committed on Apr 1

Commit

05c9154

1 Parent(s): 3f8595e

no message

Browse files

Files changed (2) hide show

app.py +8 -18
requirements.txt +2 -0

app.py CHANGED Viewed

@@ -1,21 +1,11 @@
 # -*- coding: utf-8 -*-
-import os
-import zipfile
 import gradio as gr
 from faster_whisper import WhisperModel
 import tempfile
 from huggingface_hub import hf_hub_download
-import subprocess
-import sys
-# Unzip and install cleaned israwave
-if not os.path.exists("israwave-main"):
-    with zipfile.ZipFile("israwave-clean.zip", "r") as zip_ref:
-        zip_ref.extractall(".")
-    # subprocess.check_call([sys.executable, "-m", "pip", "install", "./israwave-clean"])
-# Only after install, import israwave
-from israwave import IsrawaveTTS
 # Download model files from HF dataset (YoniAfek/israwaveTTS)
 espeak_zip_path = hf_hub_download(repo_id="YoniAfek/israwaveTTS", filename="espeak-ng-data.zip")
@@ -28,17 +18,17 @@ os.makedirs(espeak_dir, exist_ok=True)
 with zipfile.ZipFile(espeak_zip_path, "r") as zip_ref:
     zip_ref.extractall(espeak_dir)
-# Load whisper
 whisper_model = WhisperModel("ivrit-ai/whisper-large-v3-turbo-ct2")
-# Load israwave TTS
 tts = IsrawaveTTS(
     model_path=israwave_path,
     speaker_model_path=nakdimon_path,
     espeak_data_path=espeak_dir
 )
-# Transcribe + speak
 def process_audio(audio_path):
     segments, _ = whisper_model.transcribe(audio_path, language="he")
     text = " ".join([seg.text for seg in segments])
@@ -46,11 +36,11 @@ def process_audio(audio_path):
     tts.tts_to_file(text, tts_path)
     return text, tts_path
-# Interface
 demo = gr.Interface(
     fn=process_audio,
     inputs=gr.Audio(type="filepath", label="🎙️ הקלט את עצמך"),
-    outputs=[gr.Text(label="תמלול"), gr.Audio(label="השמעה בקול עברי")],
     title="תמלול ודיבור עם Israwave",
     description="המערכת מתמללת את מה שנאמר ומשמיעה אותו חזרה בקול עברי. הקבצים יורדים מ-Hugging Face Datasets"
 )

 # -*- coding: utf-8 -*-
 import gradio as gr
 from faster_whisper import WhisperModel
+from israwave import IsrawaveTTS
 import tempfile
+import os
+import zipfile
 from huggingface_hub import hf_hub_download
 # Download model files from HF dataset (YoniAfek/israwaveTTS)
 espeak_zip_path = hf_hub_download(repo_id="YoniAfek/israwaveTTS", filename="espeak-ng-data.zip")
 with zipfile.ZipFile(espeak_zip_path, "r") as zip_ref:
     zip_ref.extractall(espeak_dir)
+# Load Whisper model
 whisper_model = WhisperModel("ivrit-ai/whisper-large-v3-turbo-ct2")
+# Load Israwave TTS
 tts = IsrawaveTTS(
     model_path=israwave_path,
     speaker_model_path=nakdimon_path,
     espeak_data_path=espeak_dir
 )
+# Transcribe + TTS
 def process_audio(audio_path):
     segments, _ = whisper_model.transcribe(audio_path, language="he")
     text = " ".join([seg.text for seg in segments])
     tts.tts_to_file(text, tts_path)
     return text, tts_path
+# Gradio interface
 demo = gr.Interface(
     fn=process_audio,
     inputs=gr.Audio(type="filepath", label="🎙️ הקלט את עצמך"),
+    outputs=[gr.Text(label="תמלול"), gr.Audio(label="חזרה בקול עברי")],
     title="תמלול ודיבור עם Israwave",
     description="המערכת מתמללת את מה שנאמר ומשמיעה אותו חזרה בקול עברי. הקבצים יורדים מ-Hugging Face Datasets"
 )

requirements.txt CHANGED Viewed

@@ -1,3 +1,5 @@
 gradio
 faster-whisper
 huggingface_hub

 gradio
 faster-whisper
 huggingface_hub
+numpy
+onnxruntime