LeoNguyen101120 committed
Commit 16f0db6 · 1 Parent(s): 60924bb

Refactor Dockerfile to copy all application files into the container; add .gitignore for IDE files; update main.py and image_service.py to use OUTPUT_DIR from config; streamline file handling in process_file_service.py; remove unused OpenAI client initialization; enhance vector_store_service.py with configuration constants for improved maintainability.

.idea/.gitignore ADDED
@@ -0,0 +1,3 @@
+# Default ignored files
+/shelf/
+/workspace.xml
Dockerfile CHANGED
@@ -43,8 +43,8 @@ RUN pip install --no-cache-dir --upgrade -r requirements.txt
 # Installs all Python dependencies listed in requirements.txt. --no-cache-dir reduces image size.
 
 # 6. Copy the rest of the application code
-COPY ./src ./src
-COPY ./README.md .
+# COPY ./src ./src
+# COPY ./README.md .
 
 # What is this?
 # Copies your source code and readme into the container.
@@ -54,6 +54,8 @@ EXPOSE 7860
 
 # What is this?
 # Documents that the container will listen on port 8080 (matches your uvicorn command).
+# Copy the entire source code
+COPY . .
 
 # 8. Set the default command to run the FastAPI app
 CMD ["fastapi", "run", "src/main.py", "--port", "7860"]
src/constants/config.py ADDED
@@ -0,0 +1,15 @@
+# Device setup
+import torch
+
+TORCH_DEVICE = (
+    "cuda" if torch.cuda.is_available()
+    else "mps" if torch.backends.mps.is_available()
+    else "cpu"
+)
+IMAGE_MODEL_ID_OR_LINK = "stable-diffusion-v1-5/stable-diffusion-v1-5"
+CACHE_DIR = "/tmp/cache"
+DATA_DIR = "/tmp/data"
+EMBEDDING_MODEL = "intfloat/multilingual-e5-large-instruct"
+UPLOAD_DIR = "/tmp/uploads"
+OUTPUT_DIR = "/tmp/outputs"
+# EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
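This new module centralizes values that were previously duplicated across services. A quick sanity check of the device fallback chain (a sketch, not part of the commit):

# Prints the device the app will use: "cuda" on NVIDIA GPUs,
# "mps" on Apple Silicon, otherwise "cpu".
from constants.config import TORCH_DEVICE, OUTPUT_DIR

print(TORCH_DEVICE)
print(OUTPUT_DIR)  # "/tmp/outputs", a path writable in most container runtimes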
src/main.py CHANGED
@@ -4,6 +4,7 @@ from fastapi.exceptions import RequestValidationError
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi.responses import JSONResponse
 from fastapi.staticfiles import StaticFiles
+from constants.config import OUTPUT_DIR
 from models.responses.base_response import BaseResponse
 from routes import chat_routes, process_file_routes, vector_store_routes
 from utils.exception import CustomException
@@ -48,5 +49,5 @@ app.include_router(vector_store_routes.router, prefix="/api/v1")
 def read_root():
     return {"message": "Welcome my API"}
 
-os.makedirs("outputs", exist_ok=True)
-app.mount("/outputs", StaticFiles(directory="outputs"), name="outputs")
+os.makedirs(OUTPUT_DIR, exist_ok=True)
+app.mount(OUTPUT_DIR, StaticFiles(directory=OUTPUT_DIR), name="outputs")
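Note that app.mount's first argument is a URL path prefix, not a filesystem path, so mounting at OUTPUT_DIR moves the public route from /outputs to /tmp/outputs. A minimal sketch of the resulting routing (standard FastAPI/Starlette behavior; not part of the commit):

import os
from fastapi import FastAPI
from fastapi.staticfiles import StaticFiles

OUTPUT_DIR = "/tmp/outputs"  # value from constants/config.py

app = FastAPI()
os.makedirs(OUTPUT_DIR, exist_ok=True)  # StaticFiles requires an existing directory
app.mount(OUTPUT_DIR, StaticFiles(directory=OUTPUT_DIR), name="outputs")
# A file saved to /tmp/outputs/x.png is now served at GET /tmp/outputs/x.png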
src/services/chat_service.py CHANGED
@@ -3,8 +3,6 @@ from models.requests.chat_request import ChatRequest
 from services import vector_store_service
 from utils.timing import measure_time
 from utils.tools import tools_helper, tools_define
-from utils.client import openai_client
-
 
 def build_context_prompt(request: ChatRequest) -> list:
     """Build system prompt with context if file is provided."""
src/services/image_service.py CHANGED
@@ -1,5 +1,6 @@
 import os
 import time
+from constants.config import OUTPUT_DIR
 from utils import image_pipeline
 
 negative_promt = "blurry, distorted, pixelated, incomplete, poorly drawn, misaligned, weird proportions, bad perspective, unnatural colors, noisy, out of focus, glitchy, unsharp, overexposed, underexposed, poorly lit, bad composition, excessive noise, oversaturated, too dark, too bright, inconsistent lighting, discolored, overly stylized, unrealistic, awkward pose, unbalanced, mismatched, distorted features, flat, unnatural texture, chaotic, unreadable, incoherent, asymmetrical, low quality, lowres, wrong anatomy, bad anatomy, deformed, disfigured, ugly"
@@ -8,7 +9,7 @@ height = 512
 guidance_scale = 7.5
 num_inference_steps = 30
 
-base_url = "http://localhost:8000"
+base_url = "http://0.0.0.0:7860"
 
 def generate_image_url(prompt: str) -> str:
     """
@@ -16,8 +17,7 @@ def generate_image_url(prompt: str) -> str:
     :param prompt: The prompt used for generate the image (must be in English)
     :output: URL of the new image
     """
-    output_dir = "outputs"
-    os.makedirs(output_dir, exist_ok=True)
+    os.makedirs(OUTPUT_DIR, exist_ok=True)
     try:
         image = image_pipeline.pipeline(
             prompt=prompt,
@@ -29,9 +29,9 @@ def generate_image_url(prompt: str) -> str:
         ).images[0]
 
         file_name = f"image_{int(time.time())}.png"
-        image_path = os.path.join(output_dir, file_name)
+        image_path = os.path.join(OUTPUT_DIR, file_name)
         image.save(image_path)
 
-        return f"{base_url}/outputs/{file_name}"
+        return f"{base_url}/{OUTPUT_DIR}/{file_name}"
     except Exception as e:
         raise RuntimeError(f"Failed to generate image: {e}")
src/services/process_file_service.py CHANGED
@@ -6,12 +6,10 @@ from PIL import Image
 import pytesseract
 from langchain_community.document_loaders import PyMuPDFLoader
 from langchain_text_splitters import RecursiveCharacterTextSplitter
+from constants.config import UPLOAD_DIR
 from constants.file_type import FileType
 from services import vector_store_service
 
-UPLOAD_DIR = "uploads"
-os.makedirs(UPLOAD_DIR, exist_ok=True)
-
 def save_file(file):
     ext = os.path.splitext(file.filename)[-1].lstrip(".")
     file_id = str(uuid.uuid4())
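The module-level os.makedirs(UPLOAD_DIR, exist_ok=True) was dropped together with the local constant, so /tmp/uploads must now be created before the first write; whether save_file does this itself is not visible in the hunk. A minimal guard, assuming it is needed at startup (a sketch, not part of the commit):

import os
from constants.config import UPLOAD_DIR

# Ensure the upload directory exists before save_file writes into it.
os.makedirs(UPLOAD_DIR, exist_ok=True)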
src/services/vector_store_service.py CHANGED
@@ -1,17 +1,10 @@
 from chromadb import PersistentClient
 from langchain_chroma import Chroma
 from langchain_huggingface import HuggingFaceEmbeddings
-import torch
+from constants.config import DATA_DIR, EMBEDDING_MODEL, TORCH_DEVICE
 
-client = PersistentClient(path="/data")
-# EMBEDDING_MODEL = "intfloat/multilingual-e5-large-instruct"
-EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
-_device = (
-    "cuda" if torch.cuda.is_available()
-    else "mps" if torch.backends.mps.is_available()
-    else "cpu"
-)
-embeddings_function = HuggingFaceEmbeddings(model_name=EMBEDDING_MODEL, model_kwargs={'device': _device})
+client = PersistentClient(path=DATA_DIR)
+embeddings_function = HuggingFaceEmbeddings(model_name=EMBEDDING_MODEL, model_kwargs={'device': TORCH_DEVICE})
 vector_store = {}
 
 def get_all_collections_id():
@@ -25,7 +18,7 @@ def inspect_collection(collection_id: str):
 def get_vector_store(collection_name) -> Chroma:
     if collection_name not in vector_store:
         vector_store[collection_name] = Chroma(
-            persist_directory="./data",
+            persist_directory=DATA_DIR,
             collection_name=collection_name,
             embedding_function=embeddings_function,
         )
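get_vector_store memoizes one Chroma handle per collection in the module-level dict, now persisted under the shared DATA_DIR. A hypothetical usage (collection name invented for illustration; not part of the commit):

from services import vector_store_service

store_a = vector_store_service.get_vector_store("my_docs")
store_b = vector_store_service.get_vector_store("my_docs")
assert store_a is store_b  # second call returns the cached instance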
src/utils/client.py CHANGED
@@ -1,8 +1,4 @@
 import openai
-from dotenv import load_dotenv
-
-# Load environment variables
-load_dotenv()
 
 # Initialize OpenAI API client
 openai_client = openai.OpenAI(
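With load_dotenv() removed, the module assumes the environment is already populated by the runtime, for example Docker or Hugging Face Spaces secrets. A sketch of the default fallback (assuming openai>=1.x, where OpenAI() reads OPENAI_API_KEY from the environment; the actual constructor arguments are truncated in this hunk):

import openai

# Requires OPENAI_API_KEY to be set in the process environment,
# e.g. exported by the container runtime before startup.
client = openai.OpenAI()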
src/utils/image_pipeline.py CHANGED
@@ -1,14 +1,8 @@
 import torch
 from diffusers import StableDiffusionPipeline
+from constants.config import IMAGE_MODEL_ID_OR_LINK, TORCH_DEVICE
 
-# Device setup
-_device = (
-    "cuda" if torch.cuda.is_available()
-    else "mps" if torch.backends.mps.is_available()
-    else "cpu"
-)
 torch.backends.cuda.matmul.allow_tf32 = True  # Enable TF32 for performance on CUDA
-_model_id_or_link = "stable-diffusion-v1-5/stable-diffusion-v1-5"
 
 _pipeline = None
 
@@ -17,20 +11,20 @@ def get_pipeline() -> StableDiffusionPipeline:
     if _pipeline is None:
         try:
             _pipeline = StableDiffusionPipeline.from_pretrained(
-                _model_id_or_link,
+                IMAGE_MODEL_ID_OR_LINK,
                 torch_dtype=torch.bfloat16,
                 variant="fp16",
                 # safety_checker=True,
                 use_safetensors=True,
             )
             # _pipeline = StableDiffusionPipeline.from_single_file(
-            #     _model_id_or_link,
+            #     IMAGE_MODEL_ID_OR_LINK,
            #     torch_dtype=torch.bfloat16,
             #     variant="fp16",
             #     # safety_checker=True,
             #     use_safetensors=True,
             # )
-            _pipeline.to(_device)
+            _pipeline.to(TORCH_DEVICE)
         except Exception as e:
             raise RuntimeError(f"Failed to load the model: {e}")
     return _pipeline
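get_pipeline loads the model once and returns the same instance on later calls, moved to TORCH_DEVICE. A hypothetical call using the same generation parameters image_service.py passes (prompt invented for illustration; not part of the commit):

from utils.image_pipeline import get_pipeline

pipe = get_pipeline()  # first call loads the weights, later calls reuse them
result = pipe(
    prompt="a watercolor lighthouse at dawn",
    width=512,
    height=512,
    guidance_scale=7.5,
    num_inference_steps=30,
)
result.images[0].save("/tmp/outputs/example.png")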