Spaces:

sbenfenatti
/

sintonIA

Sleeping

App Files Files Community

sbenfenatti committed on Jul 12

Commit

f58a75c

verified ·

1 Parent(s): 44fc68a

Update app.py

Browse files

Files changed (1) hide show

app.py +292 -134

app.py CHANGED Viewed

@@ -1,148 +1,306 @@
-import os
-import io
-import base64
-import tempfile
-import logging
-import json
-import asyncio
-from fastapi import FastAPI, File, UploadFile, HTTPException
 from fastapi.responses import FileResponse, JSONResponse
-from dotenv import load_dotenv
-from faster_whisper import WhisperModel
 import google.generativeai as genai
-import edge_tts
 # ---------- Configuração Inicial ----------
-load_dotenv()
-CACHE_DIR = os.getenv("HF_HUB_CACHE", "./models_cache")
-os.environ["MPLCONFIGDIR"] = os.path.join(CACHE_DIR, "matplotlib")
-LOGIN_PASSWORDS = os.getenv("LOGIN_PASSWORDS")
-GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")
 # ---------- Aplicação FastAPI ----------
 app = FastAPI()
-logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s")
 # ---------- Carregamento de Modelos (no arranque) ----------
-whisper_model = None
-gemini_model = None
-@app.on_event("startup")
-def load_models():
-    global whisper_model, gemini_model
-    logging.info("A carregar modelos e clientes de API...")
-    try:
-        model_name = "medium"
-        whisper_model = WhisperModel(model_name, device="cpu", compute_type="int8")
-        logging.info(f"Modelo faster-whisper '{model_name}' (int8) pronto.")
-    except Exception as e:
-        logging.error(f"Falha ao iniciar o modelo faster-whisper: {e}")
-        raise RuntimeError("Não foi possível carregar o modelo Whisper.") from e
-    if GOOGLE_API_KEY:
-        try:
-            genai.configure(api_key=GOOGLE_API_KEY)
-            gemini_model = genai.GenerativeModel("gemini-1.5-flash")
-            logging.info("Gemini pronto.")
-        except Exception as e:
-            logging.error(f"Falha ao iniciar Gemini: {e}")
-            raise RuntimeError("Não foi possível carregar o modelo Gemini.") from e
-    logging.info("Modelos carregados com sucesso.")
 # ---------- Utilidades ----------
-def ask_gemini(question: str) -> str:
-    if not gemini_model:
-        raise HTTPException(status_code=503, detail="Modelo de linguagem não está disponível.")
-    prompt = (
-        "Você é 'SintonIA', um assistente de IA por voz para saúde bucal. "
-        "Responda de forma empática, clara e segura, em 2-3 frases. "
-        "NUNCA dê diagnóstico e sempre recomende consulta presencial a um dentista."
-    )
-    try:
-        response = gemini_model.generate_content([prompt, question])
-        return response.text
-    except Exception as e:
-        logging.error(f"Erro no Gemini: {e}")
-        raise HTTPException(status_code=500, detail="Erro ao gerar a resposta de IA.")
-VOICE = "pt-BR-AntonioNeural"
 async def synthesize(text: str) -> bytes | None:
-    try:
-        audio_bytes = b""
-        communicate = edge_tts.Communicate(text, VOICE)
-        async for chunk in communicate.stream():
-            if chunk["type"] == "audio":
-                audio_bytes += chunk["data"]
-        return audio_bytes
-    except Exception as e:
-        logging.error(f"Erro ao sintetizar áudio com Edge TTS: {e}")
-        return None
 # ---------- Rotas (Endpoints) ----------
 @app.get("/")
-async def read_index():
-    return FileResponse('index.html')
 @app.post("/login")
 async def login(request: dict):
-    if not LOGIN_PASSWORDS:
-        return {"success": True}
-    valid_passwords = [p.strip() for p in LOGIN_PASSWORDS.split(',')]
-    pwd_received = request.get("password", "")
-    if pwd_received not in valid_passwords:
-        raise HTTPException(status_code=401, detail="Senha incorreta.")
-    return {"success": True}
 @app.post("/process-audio")
-async def process_audio(audio: UploadFile = File(...)):
-    if not all([whisper_model, gemini_model]):
-        raise HTTPException(status_code=503, detail="Um serviço de IA não está disponível.")
-    try:
-        with tempfile.NamedTemporaryFile(delete=True, suffix=".webm") as tmp_file:
-            content = await audio.read()
-            tmp_file.write(content)
-            tmp_file.seek(0)
-            # Always transcribe, wrapping glossary in an extra list
-            glossary = [[
-                "endodontia", "periodontite", "prótese",
-                "ibuprofeno", "dipirona", "paracetamol", "naproxeno", "aspirina", "diclofenaco",
-                "amoxicilina", "amoxicilina+clavulanato", "clindamicina", "azitromicina",
-                "metronidazol", "penicilina V", "cefalexina",
-                "tramadol", "codeína"
-            ]]
-            segments, _ = whisper_model.transcribe(
-                tmp_file.name,
-                language="pt",
-                initial_prompt=glossary
-            )
-            transcribed_parts = [segment.text for segment in segments]
-            text = "".join(transcribed_parts).strip()
-            logging.info(f"Texto transcrito: '{text}'")
-    except Exception as e:
-        logging.error(f"Erro na transcrição do faster-whisper: {e}")
-        text = ""
-    if not text:
-        ai_text = "Desculpe, não entendi o que foi dito. Você poderia repetir, por favor?"
-    else:
-        ai_text = ask_gemini(text)
-    audio_bytes = None
-    if ai_text:
-        audio_bytes = await synthesize(ai_text)
-    return JSONResponse(content={
-        "user_question": text,
-        "ai_answer": ai_text,
-        "audio_base64": base64.b64encode(audio_bytes).decode('utf-8') if audio_bytes else None
-    })
 @app.get("/healthz")
-async def health_check():
-    return {"status": "OK"}

+import os, io, base64, tempfile, logging, json, asyncio
+from fastapi import FastAPI, File, UploadFile, Form, HTTPException
 from fastapi.responses import FileResponse, JSONResponse
+from dotenv import load_dotenv
+from faster_whisper import WhisperModel
 import google.generativeai as genai
+import edge_tts
 # ---------- Configuração Inicial ----------
+load_dotenv()
+CACHE_DIR = os.getenv("HF_HUB_CACHE", "./models_cache")
+os.environ["MPLCONFIGDIR"] = os.path.join(CACHE_DIR, "matplotlib")
+LOGIN_PASSWORDS = os.getenv("LOGIN_PASSWORDS")
+GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")
 # ---------- Aplicação FastAPI ----------
 app = FastAPI()
+logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s")
 # ---------- Carregamento de Modelos (no arranque) ----------
+whisper_model = None
+gemini_model = None
+@app.on_event("startup")
+def load_models():
+    global whisper_model, gemini_model
+    logging.info("A carregar modelos e clientes de API...")
+    try:
+        model_name = "medium"
+        whisper_model = WhisperModel(model_name, device="cpu", compute_type="int8")
+        logging.info(f"Modelo faster-whisper '{model_name}' (int8) pronto.")
+    except Exception as e:
+        logging.error(f"Falha ao iniciar o modelo faster-whisper: {e}")
+        raise RuntimeError("Não foi possível carregar o modelo Whisper.") from e
+    if GOOGLE_API_KEY:
+        try:
+            genai.configure(api_key=GOOGLE_API_KEY)
+            gemini_model = genai.GenerativeModel("gemini-1.5-flash")
+            logging.info("Gemini pronto.")
+        except Exception as e:
+            logging.error(f"Falha ao iniciar Gemini: {e}")
+            raise RuntimeError("Não foi possível carregar o modelo Gemini.") from e
+    logging.info("Modelos carregados com sucesso.")
 # ---------- Utilidades ----------
+def ask_gemini(question: str) -> str:
+    if not gemini_model:
+        raise HTTPException(status_code=503, detail="Modelo de linguagem não está disponível.")
+    prompt = ("Você é 'SintonIA', um assistente de IA por voz para saúde bucal. "
+              "Responda de forma empática, clara e segura, em 2-3 frases. "
+              "NUNCA dê diagnóstico e sempre recomende consulta presencial a um dentista.")
+    try:
+        response = gemini_model.generate_content([prompt, question])
+        return response.text
+    except Exception as e:
+        logging.error(f"Erro no Gemini: {e}")
+        raise HTTPException(status_code=500, detail="Erro ao gerar a resposta de IA.")
+VOICE = "pt-BR-AntonioNeural"
 async def synthesize(text: str) -> bytes | None:
+    try:
+        audio_bytes = b""
+        communicate = edge_tts.Communicate(text, VOICE)
+        async for chunk in communicate.stream():
+            if chunk["type"] == "audio":
+                audio_bytes += chunk["data"]
+        return audio_bytes
+    except Exception as e:
+        logging.error(f"Erro ao sintetizar áudio com Edge TTS: {e}")
+        return None
 # ---------- Rotas (Endpoints) ----------
 @app.get("/")
+async def read_index():
+    return FileResponse('index.html')
 @app.post("/login")
 async def login(request: dict):
+    if not LOGIN_PASSWORDS:
+        return {"success": True}
+    valid_passwords = [p.strip() for p in LOGIN_PASSWORDS.split(',')]
+    pwd_received = request.get("password", "")
+    is_ok = pwd_received in valid_passwords
+    if not is_ok:
+        raise HTTPException(status_code=401, detail="Senha incorreta.")
+    return {"success": True}
 @app.post("/process-audio")
+async def process_audio(audio: UploadFile = File(...)):
+    if not all([whisper_model, gemini_model]):
+        raise HTTPException(status_code=503, detail="Um serviço de IA não está disponível.")
+    try:
+        with tempfile.NamedTemporaryFile(delete=True, suffix=".webm") as tmp_file:
+            content = await audio.read()
+            tmp_file.write(content)
+            tmp_file.seek(0)
+            if os.path.getsize(tmp_file.name) > 1000:
+                segments, _ = whisper_model.transcribe(tmp_file.name, language="pt")
+                transcribed_parts = [segment.text for segment in segments]
+                text = "".join(transcribed_parts).strip()
+                logging.info(f"Texto transcrito: '{text}'")
+            else:
+                text = ""
+    except Exception as e:
+        logging.error(f"Erro na transcrição do faster-whisper: {e}")
+        text = ""
+    if not text:
+        ai_text = "Desculpe, não entendi o que foi dito. Você poderia repetir, por favor?"
+    else:
+        ai_text = ask_gemini(text)
+    audio_bytes = None
+    if ai_text:
+        audio_bytes = await synthesize(ai_text)
+    # --- LÓGICA FINAL: Retorna um JSON com todos os dados ---
+    return JSONResponse(content={
+        "user_question": text,
+        "ai_answer": ai_text,
+        "audio_base64": base64.b64encode(audio_bytes).decode('utf-8') if audio_bytes else None
+    })
 @app.get("/healthz")
+async def health_check():
+    return {"status": "OK"}