candenizkocak committed
Commit f276112 · verified · 1 Parent(s): 65134ea

Update app.py

Files changed (1):
  1. app.py (+72 -136)

app.py CHANGED
@@ -1,139 +1,75 @@
-import gradio as gr
-import uuid
-from typing import Sequence
-
-from langchain.chains import create_history_aware_retriever, create_retrieval_chain
-from langchain.chains.combine_documents import create_stuff_documents_chain
-from langchain_community.document_loaders import TextLoader
-from langchain_core.messages import AIMessage, BaseMessage, HumanMessage
-from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
-from langchain_core.vectorstores import InMemoryVectorStore
-
-from langchain_groq import ChatGroq
-from langchain_huggingface import HuggingFaceEmbeddings
-
-from langchain_text_splitters import RecursiveCharacterTextSplitter
-from langgraph.checkpoint.memory import MemorySaver
-from langgraph.graph import START, StateGraph
-from langgraph.graph.message import add_messages
-from typing_extensions import Annotated, TypedDict
-
 import os
-GROQ_API_KEY = os.getenv("GROQ_API_KEY")
-
-llm = ChatGroq(model="llama-3.2-11b-text-preview", api_key=GROQ_API_KEY, temperature=0)
-
-### Construct retriever ###
-loader = TextLoader("stj.txt")
-docs = loader.load()
-
-model_name = "sentence-transformers/all-MiniLM-L6-v2"
-model_kwargs = {'device': 'cpu'}
-encode_kwargs = {'normalize_embeddings': False}
-hf = HuggingFaceEmbeddings(
-    model_name=model_name,
-    model_kwargs=model_kwargs,
-    encode_kwargs=encode_kwargs
-)
-
-text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
-splits = text_splitter.split_documents(docs)
-vectorstore = InMemoryVectorStore.from_documents(
-    documents=splits, embedding=hf
-)
-retriever = vectorstore.as_retriever()
-
-### Contextualize question ###
-contextualize_q_system_prompt = (
-    "Sohbet geçmişi ve en son kullanıcı sorusu verilirse, sohbet geçmişine atıfta bulunabilecek en son kullanıcı sorusunu, sohbet geçmişi olmadan anlaşılabilecek bağımsız bir soru haline getirin. Soruyu yanıtlamayın, sadece yeniden düzenleyin ve gerekirse geri döndürün."
-)
-contextualize_q_prompt = ChatPromptTemplate.from_messages(
-    [
-        ("system", contextualize_q_system_prompt),
-        MessagesPlaceholder("chat_history"),
-        ("human", "{input}"),
-    ]
-)
-history_aware_retriever = create_history_aware_retriever(
-    llm, retriever, contextualize_q_prompt
-)
-
-### Answer question ###
-system_prompt = (
-    "Soru-cevap görevleri için bir asistansın. Soruyu yanıtlamak için alınan aşağıdaki bağlam parçalarını kullan. Cevabı bilmiyorsan, bilmiyorum de. Cevabı üç cümleyle sınırla ve kısa tut."
-    "\n\n"
-    "{context}"
-)
-qa_prompt = ChatPromptTemplate.from_messages(
-    [
-        ("system", system_prompt),
-        MessagesPlaceholder("chat_history"),
-        ("human", "{input}"),
-    ]
-)
-question_answer_chain = create_stuff_documents_chain(llm, qa_prompt)
-
-rag_chain = create_retrieval_chain(history_aware_retriever, question_answer_chain)
-
-### Statefully manage chat history ###
-class State(TypedDict):
-    input: str
-    chat_history: Annotated[Sequence[BaseMessage], add_messages]
-    context: str
-    answer: str
-
-def call_model(state: State):
-    response = rag_chain.invoke(state)
-    return {
-        "chat_history": [
-            HumanMessage(state["input"]),
-            AIMessage(response["answer"]),
+import gradio as gr
+from groq import Groq
+
+api_key = os.getenv("GROQ_API_KEY")
+if not api_key:
+    raise ValueError("API key not found. Please set the GROQ_API_KEY environment variable.")
+
+client = Groq(api_key=api_key)
+
+def transcribe_audio(file_path):
+    with open(file_path, "rb") as file:
+        transcription = client.audio.transcriptions.create(
+            file=(file_path, file.read()),
+            model="whisper-large-v3",
+            response_format="verbose_json",
+        )
+    return transcription.text
+
+def get_chat_completion(prompt):
+    completion = client.chat.completions.create(
+        model="llama-3.2-11b-text-preview",
+        messages=[
+            {
+                "role": "user",
+                "content": prompt
+            }
         ],
-        "context": response["context"],
-        "answer": response["answer"],
-    }
-
-workflow = StateGraph(state_schema=State)
-workflow.add_edge(START, "model")
-workflow.add_node("model", call_model)
-
-memory = MemorySaver()
-app = workflow.compile(checkpointer=memory)
-
-# Session storage
-session_storage = {}
-
-# Function to interact with the RAG model
-def rag_response(user_input, chat_history, session_id):
-    config = {"configurable": {"thread_id": "abc123"}}
-
-    # Prepare the state with input and chat history
-    state = {
-        "input": user_input,
-        "chat_history": session_storage[session_id]["chat_history"]  # Get chat history for this session
-    }
-
-    # Call the RAG model to get the response
-    result = app.invoke(state, config=config)
-
-    # Update session storage
-    session_storage[session_id]["chat_history"].append((user_input, result["answer"]))
-
-    return "", session_storage[session_id]["chat_history"]
-
-# Define the Gradio interface
-with gr.Blocks() as demo:
-
-    chatbox = gr.Chatbot(label="Chat History")
-    user_input = gr.Textbox(placeholder="Enter your question", label="User Input")
-    submit_button = gr.Button("Submit")
-
-    # Create a unique session ID
-    session_id = str(uuid.uuid4())
-    session_storage[session_id] = {"chat_history": []}
-
-    # Connect the button click event to the rag_response function
-    submit_button.click(rag_response, inputs=[user_input, chatbox, session_id], outputs=[user_input, chatbox])
+        temperature=1,
+        max_tokens=1024,
+        top_p=1,
+        stream=True,
+        stop=None,
+    )
+
+    response = ""
+    for chunk in completion:
+        response += chunk.choices[0].delta.content or ""
+    return response
+
+def process_input(audio_file, text_input, chat_history):
+    if audio_file is not None:
+        transcription_text = transcribe_audio(audio_file)
+    else:
+        transcription_text = text_input
+
+    chat_response = get_chat_completion(transcription_text)
+    chat_history.append(("👤", transcription_text))
+    chat_history.append(("🤖", chat_response))
+
+    formatted_history = "\n".join([f"{role}: {content}\n" for role, content in chat_history])
+
+    return formatted_history, gr.update(value=None), gr.update(value=''), chat_history
+
+# Create Gradio interface
+interface = gr.Interface(
+    fn=process_input,
+    inputs=[
+        gr.Audio(type="filepath", label="Upload Audio or Record"),
+        gr.Textbox(lines=2, placeholder="Or type text here", label="Text Input"),
+        gr.State([])
+    ],
+    outputs=[
+        gr.Textbox(label="Chat History", lines=20),
+        gr.Audio(visible=False),
+        gr.Textbox(visible=False),
+        gr.State()
+    ],
+    title="Chat with Llama 3.2-11B With Text or Voice (Whisper Large-v3)",
+    description="Upload an audio file or type text to get a chat response based on the transcription.",
+    allow_flagging='never'  # Prevent flagging to isolate sessions
+)
 
-# Launch the Gradio app
-demo.launch()
+if __name__ == "__main__":
+    interface.launch()
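
For reference, the transcription call added above follows the Groq SDK's audio API: the file is passed as a (filename, bytes) tuple. A minimal standalone sketch of the same pattern (the "sample.mp3" path is a hypothetical placeholder, not a file in this repo):

import os
from groq import Groq

# Assumes GROQ_API_KEY is set in the environment, as in app.py.
client = Groq(api_key=os.getenv("GROQ_API_KEY"))

# "sample.mp3" is a hypothetical test file, used only for illustration.
with open("sample.mp3", "rb") as f:
    transcription = client.audio.transcriptions.create(
        file=("sample.mp3", f.read()),   # (filename, bytes) tuple, as in transcribe_audio()
        model="whisper-large-v3",
        response_format="verbose_json",  # verbose JSON also carries segment/timing metadata
    )

print(transcription.text)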
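
Similarly, get_chat_completion() buffers the streamed response by concatenating each chunk's delta. The same stream can instead be printed token by token; a minimal sketch, assuming the same client setup and model as app.py:

import os
from groq import Groq

client = Groq(api_key=os.getenv("GROQ_API_KEY"))

# With stream=True, a chunk's .choices[0].delta.content may be None,
# hence the `or ""` guard (the same guard app.py uses while buffering).
stream = client.chat.completions.create(
    model="llama-3.2-11b-text-preview",
    messages=[{"role": "user", "content": "Say hello in one short sentence."}],
    temperature=1,
    max_tokens=1024,
    stream=True,
)

for chunk in stream:
    print(chunk.choices[0].delta.content or "", end="", flush=True)
print()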