yama committed
Commit 7943b58 · Parent(s): 6006f4b

Update app.py

Files changed (1):
  1. app.py (+20 -2)
app.py CHANGED

@@ -26,6 +26,7 @@ import wave
 import contextlib
 from transformers import pipeline
 import psutil
+import openai
 
 whisper_models = ["tiny", "base", "small", "medium", "large-v1", "large-v2"]
 source_languages = {
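Note on the new import: `openai.ChatCompletion.create`, used in the next hunk, is the legacy pre-1.0 surface of the OpenAI Python SDK; it was removed in `openai>=1.0`, so the Space's requirements would need an `openai<1.0` pin for this diff to run as written.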
@@ -351,6 +352,22 @@ def speech_to_text(video_file_path, selected_source_lang, whisper_model, num_spe
         raise RuntimeError("Error Running inference with local model", e)
 
 
+def create_transcription_summary(openai_key, prompt):
+    openai.api_key = openai_key
+    system_template = prompt
+
+    transcript_text = ""
+    completion = openai.ChatCompletion.create(
+        model="gpt-3.5-turbo",
+        messages=[
+            {"role": "system", "content": system_template},
+            {"role": "user", "content": transcript_text}
+        ]
+    )
+    transcript_summary = completion.choices[0].message.content
+    return transcript_summary
+
+
 # ---- Gradio Layout -----
 # Inspiration from https://huggingface.co/spaces/RASMUS/Whisper-youtube-crosslingual-subtitles
 video_in = gr.Video(label="Video file", mirror_webcam=False)
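For reference, a minimal usage sketch of the new helper (hypothetical key and prompt values, assuming `openai<1.0`). Note that in this commit `transcript_text` is hard-coded to an empty string inside the function, so the model only ever sees the system prompt:

    # Usage sketch (hypothetical values, not part of this commit).
    summary = create_transcription_summary(
        openai_key="sk-...",  # user-supplied OpenAI API key
        prompt="Summarize the meeting transcript.",
    )
    print(summary)  # model output; the transcript is empty as of this commit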
@@ -375,7 +392,7 @@ openai_prompt_in = gr.TextArea(label="openai_prompt", value="""会議の文字
 - 会議の目的
 - 会議の内容
 - 会議の結果""")
-transcription_summary = gr.Textbox(label="summary")
+transcription_summary_out = gr.Textbox(label="transcription_summary")
 title = "Whisper speaker diarization"
 demo = gr.Blocks(title=title)
 demo.encrypt = False
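(For non-Japanese readers: the truncated `gr.TextArea` default value is a Japanese prompt beginning "会議の文字…" ("the meeting transcript…"), and the bulleted lines translate to "purpose of the meeting", "content of the meeting", and "results of the meeting".)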
@@ -445,7 +462,8 @@ with demo:
         transcription_df.render()
         openai_key_in.render()
         openai_prompt_in.render()
-        transcription_summary.render()
+        transcription_summary_btn = gr.Button("Evaluate and analyze transcription content")
+        transcription_summary_out.render()
         system_info.render()
         gr.Markdown(
             '''<center><img src='https://visitor-badge.glitch.me/badge?page_id=WhisperDiarizationSpeakers' alt='visitor badge'><a href="https://opensource.org/licenses/Apache-2.0"><img src='https://img.shields.io/badge/License-Apache_2.0-blue.svg' alt='License: Apache 2.0'></center>''')
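The diff adds the button and the output textbox, but no click handler appears in this commit, so the pieces are not wired together yet. A minimal sketch of the likely wiring, assuming standard Gradio `Button.click` semantics and the component names above:

    # Hypothetical wiring (not part of this commit): feed the key and
    # prompt textboxes to the new helper and show the result in the
    # output textbox.
    transcription_summary_btn.click(
        create_transcription_summary,
        inputs=[openai_key_in, openai_prompt_in],
        outputs=[transcription_summary_out],
    )

Even with this wiring, the summary would be computed over the empty `transcript_text`; feeding the actual transcription (e.g. the contents behind `transcription_df`) into the function would be a follow-up change.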