File size: 1,959 Bytes
4aaf734
 
1dba1e4
4455993
 
8c9ed7b
4455993
 
 
 
 
6d20477
 
 
 
 
 
 
 
 
 
 
 
 
d68be0e
e5ab26b
 
 
 
 
a2a4283
941538f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8c9ed7b
941538f
822a106
8c9ed7b
 
 
 
 
 
 
 
 
 
dbcf40b
8c9ed7b
a2a4283
 
230d1b0
8c9ed7b
b6f4906
4d16580
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
# Base image: NVIDIA CUDA 11.8.0 with cuDNN 8 (devel variant) on Ubuntu 22.04.
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu22.04

# Build-time only: keeps apt from prompting during the build without leaving
# DEBIAN_FRONTEND in the environment of the running container.
ARG DEBIAN_FRONTEND=noninteractive

# System packages. The first group is general tooling; the second group
# (build-essential .. zlib1g-dev) is the set of Python build dependencies.
# The apt package lists are removed in the same layer so they do not end up
# in the image.
# NOTE(review): nvidia-driver-515 is installed inside the image; GPU drivers
# are normally provided by the host's container runtime - confirm it is needed.
RUN apt-get update && \
    apt-get upgrade -y && \
    apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
        ffmpeg \
        git \
        git-lfs \
        nvidia-driver-515 \
        wget \
        build-essential \
        libbz2-dev \
        libffi-dev \
        liblzma-dev \
        libncursesw5-dev \
        libreadline-dev \
        libsqlite3-dev \
        libssl-dev \
        libxml2-dev \
        libxmlsec1-dev \
        tk-dev \
        xz-utils \
        zlib1g-dev && \
    rm -rf /var/lib/apt/lists/*

# Create an unprivileged account with UID 1000 and switch to it for all
# following instructions.
ENV USER=user
RUN useradd -m -u 1000 ${USER}
USER ${USER}

# HOME gets its own ENV instruction: variable substitution inside a single
# ENV uses the values from before that instruction, so a PATH defined in the
# same instruction would not see the new HOME.
ENV HOME=/home/${USER}
ENV PATH=${HOME}/.local/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:${PATH}
    
WORKDIR ${HOME}/app

    
# Install pyenv via its installer script. The script is downloaded to a file
# first (-f: fail on HTTP errors, -L: follow redirects) so that a failed
# download aborts the build instead of piping a partial script into bash.
RUN curl -fsSL https://pyenv.run -o /tmp/pyenv-installer.sh && \
    bash /tmp/pyenv-installer.sh && \
    rm -f /tmp/pyenv-installer.sh
# Put the pyenv executable and its shims ahead of the system binaries.
ENV PATH=${HOME}/.pyenv/shims:${HOME}/.pyenv/bin:${PATH}
# Python version installed through pyenv; override with
# --build-arg PYTHON_VERSION=<version>.
ARG PYTHON_VERSION=3.10.13

# Install the requested interpreter, make it the global default, refresh the
# pyenv shims, then install the packaging tools and the application's Python
# dependencies. --no-cache-dir keeps pip's download cache out of the layer.
RUN pyenv install ${PYTHON_VERSION} && \
    pyenv global ${PYTHON_VERSION} && \
    pyenv rehash && \
    pip install --no-cache-dir -U pip setuptools wheel && \
    pip install --no-cache-dir \
        "huggingface-hub" \
        "hf-transfer" \
        "gradio[oauth]>=4.28.0" \
        "gradio_huggingfacehub_search==0.0.7" \
        "APScheduler"

# Copy the build context into the app directory, owned by UID 1000.
COPY --chown=1000 . ${HOME}/app

# Fetch the ollama and llama.cpp sources into the working directory.
RUN git clone https://github.com/ollama/ollama.git
RUN git clone https://github.com/ggerganov/llama.cpp

# Python requirements shipped with llama.cpp; --no-cache-dir keeps pip's
# download cache out of the layer.
RUN pip install --no-cache-dir -r llama.cpp/requirements.txt

# Place groups_merged.txt inside the llama.cpp checkout, with the same
# ownership as the rest of the app files.
COPY --chown=1000 groups_merged.txt ${HOME}/app/llama.cpp/

    
# Runtime environment, grouped by the component each variable is named after.

# Python interpreter.
ENV PYTHONPATH=${HOME}/app \
    PYTHONUNBUFFERED=1

# Hugging Face Hub and the hosting platform marker.
ENV HF_HUB_ENABLE_HF_TRANSFER=1 \
    SYSTEM=spaces

# Gradio.
ENV GRADIO_ALLOW_FLAGGING=never \
    GRADIO_NUM_PORTS=1 \
    GRADIO_SERVER_NAME=0.0.0.0 \
    GRADIO_THEME=huggingface

# tqdm.
ENV TQDM_POSITION=-1 \
    TQDM_MININTERVAL=1

# NVIDIA libraries and device visibility.
ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64:/usr/local/cuda/lib64:${LD_LIBRARY_PATH} \
    NVIDIA_DRIVER_CAPABILITIES=compute,utility \
    NVIDIA_VISIBLE_DEVICES=all

# Ollama.
ENV OLLAMA_HOST=0.0.0.0
    

# EXPOSE 11434

# Exec form: /bin/sh runs start.sh directly as PID 1 (no extra `sh -c`
# wrapper), so the script receives the signals sent on container stop.
# start.sh is resolved relative to the working directory; presumably it is
# part of the copied build context - verify.
ENTRYPOINT ["/bin/sh", "start.sh"]