# Use the base image from noneabove1182/koboldcpp | |
FROM noneabove1182/koboldcpp:latest | |
# Set the working directory | |
WORKDIR /app | |
# Define environment variables directly in the Dockerfile | |
ENV MODEL_DIR=/app/models | |
ENV MODEL=LLaMA2-13B-Tiefighter.Q4_K_S.gguf | |
# Create the model directory | |
RUN mkdir -p ${MODEL_DIR} | |
# Download the model file | |
RUN apt-get update && apt-get install -y wget && \ | |
wget -O ${MODEL_DIR}/${MODEL} https://dev-motoemoto47ark123-dl-server-1.hf.space/files/LLaMA2-13B-Tiefighter.Q4_K_S.gguf | |
# Expose the port the application will run on | |
EXPOSE 8080 | |
# Set the entry point to run the application | |
CMD ["python", "koboldcpp.py", "--model", "/app/models/${MODEL}", "--port", "8080", "--usemlock"] | |