Spaces:

NaikPriyank
/

ConvoTrack

Running

App Files Files Community

NaikPriyank committed 6 days ago

Commit

4b84617

verified ·

1 Parent(s): 2958b31

Update genAI.py

Browse files

Added the text-to-speech model feature for every response generated by the model.

Files changed (1) hide show

genAI.py +32 -0

genAI.py CHANGED Viewed

@@ -149,6 +149,21 @@ def load_and_preprocess(uploaded_file):
                 for item in data if item["text"].strip()]
     return data, passages
 def load_model(model_name="BAAI/bge-m3"):
     tokenizer = AutoTokenizer.from_pretrained(model_name)
@@ -250,6 +265,7 @@ def main():
     if st.session_state.faiss_index:
         st.header("Ask a Question")
         user_query = st.text_input("Type your question here:")
         if user_query:
             response = handle_userinput(user_query)
@@ -259,6 +275,12 @@ def main():
             st.session_state.chat_history_ui.append({"role": "user", "content": user_query})
             st.session_state.chat_history_ui.append({"role": "bot", "content": response})
     if "chat_history_ui" in st.session_state:
@@ -267,6 +289,16 @@ def main():
                 message(chat["content"], is_user=True,key=f"user_{i}")
             else:
                 message(chat["content"], is_user=False,key=f"bot_{i}")
 if __name__ == "__main__":

                 for item in data if item["text"].strip()]
     return data, passages
+def generate_text_to_speech(text):
+  API_KEY = 'sk_926210280a2b0e013545e33350ae35c73a080b0f24f9542e'
+  VOICE_ID = 'TX3LPaxmHKxFdv7VOQHJ'
+  url = f"https://api.elevenlabs.io/v1/text-to-speech/{VOICE_ID}"
+  headers = {
+    "Content-Type": "application/json",
+    "xi-api-key": API_KEY
+  }
+  payload = {
+        "text": text,
+        "model_id": "eleven_monolingual_v1",
+        "voice_settings": {"stability": 0.5, "similarity_boost": 0.75}
+    }
+  response = requests.post(url, headers=headers, json=payload)
+  return response.content if response.status_code == 200 else None
 def load_model(model_name="BAAI/bge-m3"):
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     if st.session_state.faiss_index:
         st.header("Ask a Question")
         user_query = st.text_input("Type your question here:")
+        play_audio = st.checkbox("🔊 Generate audio for the response")
         if user_query:
             response = handle_userinput(user_query)
             st.session_state.chat_history_ui.append({"role": "user", "content": user_query})
             st.session_state.chat_history_ui.append({"role": "bot", "content": response})
+            if play_audio:
+                if "audio_cache" not in st.session_state:
+                    st.session_state.audio_cache = {}
+                if response not in st.session_state.audio_cache:
+                    audio_bytes = generate_text_to_speech(response)
+                    st.session_state.audio_cache[response] = audio_bytes
     if "chat_history_ui" in st.session_state:
                 message(chat["content"], is_user=True,key=f"user_{i}")
             else:
                 message(chat["content"], is_user=False,key=f"bot_{i}")
+                audio_bytes = st.session_state.get("audio_cache", {}).get(chat["content"])
+                if audio_bytes:
+                    st.audio(audio_bytes, format="audio/mpeg",start_time=0)
+                else:
+                    if st.button(f"🔊 Generate & Play Audio for Response {i}"):
+                        audio = generate_text_to_speech(chat["content"])
+                        if "audio_cache" not in st.session_state:
+                            st.session_state.audio_cache = {}
+                        st.session_state.audio_cache[chat["content"]] = audio
+                        st.audio(audio, format="audio/mpeg", start_time=0)
 if __name__ == "__main__":