# GPU image for a Python app: CUDA 12.1 / cuDNN 8 runtime on Ubuntu 22.04,
# PyTorch 2.4.0 built against cu121, application started via `python3 app.py`.

FROM nvidia/cuda:12.1.1-cudnn8-runtime-ubuntu22.04

# Build-time only: stops apt/debconf from prompting during `docker build`.
# Declared as ARG (not ENV) so it is visible to the RUN steps below without
# being baked into the environment of the running container.
ARG DEBIAN_FRONTEND=noninteractive

# Runtime configuration exported to the application process.
# NOTE(review): recent `transformers` releases reportedly deprecate
# TRANSFORMERS_CACHE in favour of HF_HOME; it is kept here for compatibility
# with whatever version requirements.txt pins - confirm before removing.
ENV OMP_NUM_THREADS=1 \
    TOKENIZERS_PARALLELISM=false \
    PYTHONUNBUFFERED=1 \
    HF_HOME=/home/user/.cache/huggingface \
    TRANSFORMERS_CACHE=/home/user/.cache/huggingface/transformers \
    HF_DATASETS_CACHE=/home/user/.cache/huggingface/datasets \
    OFFLOAD_DIR=/home/user/app/offload \
    MERGED_MODEL_DIR=/home/user/app/merged-model \
    QUANTIZE=4bit

# Read by the NVIDIA container runtime to decide which GPUs and driver
# capabilities are made available inside the container.
ENV NVIDIA_VISIBLE_DEVICES=all \
    NVIDIA_DRIVER_CAPABILITIES=compute,utility

# OS packages. update + install + list cleanup share one layer so the apt
# index can never be stale and never ends up in the image.
# `git lfs install --system` writes the LFS filter config to /etc/gitconfig so
# it applies to every account, including the non-root user created below
# (a plain `git lfs install` would only configure root's ~/.gitconfig).
RUN apt-get update && apt-get install -y --no-install-recommends \
        ca-certificates \
        git \
        git-lfs \
        python3 \
        python3-pip \
    && rm -rf /var/lib/apt/lists/* \
    && git lfs install --system

# Unprivileged account that owns the app and cache directories.
# NOTE(review): the /home/user/... paths and port 7860 look like a Hugging Face
# Spaces deployment, which is documented to run containers as UID 1000 -
# confirm the target platform; UID 1000 is used here to match that convention.
RUN useradd --create-home --uid 1000 user

WORKDIR /home/user/app

RUN python3 -m pip install --no-cache-dir --upgrade pip

# PyTorch comes from the CUDA 12.1 wheel index so the wheels match the base
# image's CUDA runtime. Kept in its own layer because it is large and changes
# far less often than requirements.txt.
RUN python3 -m pip install --no-cache-dir \
        --index-url https://download.pytorch.org/whl/cu121 \
        torch==2.4.0 torchvision==0.19.0 torchaudio==2.4.0

# Copy the dependency manifest on its own first: the install layer below is
# then reused from cache until requirements.txt itself changes.
COPY requirements.txt .

RUN python3 -m pip install --no-cache-dir -r requirements.txt

# Application source, owned by the runtime user.
# A .dockerignore is recommended so .git, caches and secrets stay out of the
# build context.
COPY --chown=user:user . .

# Pre-create every writable directory named in ENV above and hand it (plus the
# working directory itself) to the runtime user, so the app can write model
# caches, offload shards and merged weights without root.
RUN mkdir -p "$OFFLOAD_DIR" "$MERGED_MODEL_DIR" "$HF_HOME" "$TRANSFORMERS_CACHE" "$HF_DATASETS_CACHE" \
    && chown user:user /home/user /home/user/app \
    && chown -R user:user /home/user/.cache "$OFFLOAD_DIR" "$MERGED_MODEL_DIR"

# Everything from here on, including the container's main process, runs
# without root privileges.
USER user

# Documentation only: the port must still be published at `docker run` time.
EXPOSE 7860

# Exec form so python3 is PID 1 and receives SIGTERM from `docker stop`.
CMD ["python3", "app.py"]