alien-commie-ifr3-k05 / Dockerfile
manbeast3b's picture
Upload folder using huggingface_hub
3f56b21 verified
FROM nvidia/cuda:12.3.2-cudnn9-devel-ubuntu22.04
# Set environment variables
ENV PYTHONUNBUFFERED=1 \
DEBIAN_FRONTEND=noninteractive \
CUDA_HOME=/usr/local/cuda \
PATH=/usr/local/cuda/bin:$PATH \
LD_LIBRARY_PATH=/usr/local/cuda/lib64:$LD_LIBRARY_PATH \
NVIDIA_VISIBLE_DEVICES=all \
NVIDIA_DRIVER_CAPABILITIES=compute,utility \
HF_HOME=/app/models \
TRITON_CACHE_DIR=/tmp/triton_cache \
XDG_CACHE_HOME=/tmp \
NUMBA_CACHE_DIR=/tmp/numba_cache
# Install system dependencies
RUN apt-get update && apt-get install -y --no-install-recommends \
python3 \
python3-pip \
python3-dev \
build-essential \
git \
git-lfs \
ffmpeg \
libsndfile1 \
curl \
&& rm -rf /var/lib/apt/lists/*
# Initialize Git LFS
RUN git lfs install
# Upgrade pip and install build tools
RUN python3 -m pip install --upgrade pip setuptools wheel uv
WORKDIR /app
# Create Numba cache directory
RUN mkdir -p /tmp/numba_cache /tmp/triton_cache && \
chown nobody:nogroup /tmp/numba_cache /tmp/triton_cache && \
chmod 700 /tmp/numba_cache /tmp/triton_cache
COPY requirements.txt .
# Install other requirements
RUN python3 -m uv pip install --no-cache-dir -r requirements.txt --prerelease=allow
COPY . .
EXPOSE 8000
CMD ["python3", "server.py"]