Spaces:

candenizkocak
/

chat_with_llama_3.2_using_whisper

Running

App Files Files Community

candenizkocak commited on Aug 10, 2024

Commit

1f2ea7d

verified ·

1 Parent(s): 3911815

Create app.py

Browse files

Files changed (1) hide show

app.py +81 -0

app.py ADDED Viewed

	@@ -0,0 +1,81 @@

+import os
+import gradio as gr
+from groq import Groq
+# Retrieve API key from environment variable
+api_key = os.getenv("GROQ_API_KEY")
+client = Groq(api_key=api_key)
+if not api_key:
+    raise ValueError("API key not found. Please set the GROQ_API_KEY environment variable.")
+#client = Groq(api_key=api_key)
+chat_history = []
+def transcribe_audio(file_path):
+    with open(file_path, "rb") as file:
+        transcription = client.audio.transcriptions.create(
+            file=(file_path, file.read()),
+            model="whisper-large-v3",
+            response_format="verbose_json",
+        )
+        return transcription.text
+def get_chat_completion(prompt):
+    completion = client.chat.completions.create(
+        model="llama-3.1-8b-instant",
+        messages=[
+            {
+                "role": "user",
+                "content": prompt
+            }
+        ],
+        temperature=1,
+        max_tokens=1024,
+        top_p=1,
+        stream=True,
+        stop=None,
+    )
+    response = ""
+    for chunk in completion:
+        response += chunk.choices[0].delta.content or ""
+    return response
+def process_input(audio_file, text_input):
+    global chat_history
+    if audio_file is not None:
+        transcription_text = transcribe_audio(audio_file)
+    else:
+        transcription_text = text_input
+    chat_response = get_chat_completion(transcription_text)
+    chat_history.append(("👤", transcription_text))
+    chat_history.append(("🤖", chat_response))
+    # Format chat history for display
+    formatted_history = "\n".join([f"{role}: {content}\n" for role, content in chat_history])
+    # Return chat history and instructions to clear inputs
+    return formatted_history, gr.update(value=None), gr.update(value='')
+# Create Gradio interface
+interface = gr.Interface(
+    fn=process_input,
+    inputs=[
+        gr.Audio(type="filepath", label="Upload Audio or Record"),
+        gr.Textbox(lines=2, placeholder="Or type text here", label="Text Input")
+    ],
+    outputs=[
+        gr.Textbox(label="Chat History", lines=20),
+        gr.Audio(visible=False),  # Hidden output to reset audio input
+        gr.Textbox(visible=False)  # Hidden output to reset text input
+    ],
+    title="Chat with Llama 3.1-8B With Text or Voice (Whisper Large-v3)",
+    description="Upload an audio file or type text to get a chat response based on the transcription."
+)
+if __name__ == "__main__":
+    interface.launch()