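# NOTE: the next seven lines are Hugging Face file-viewer page text that was
# captured together with this file. They are not Dockerfile instructions and
# are kept only as comments so the file parses.
# ubuntu / Dockerfile
# likhonsheikh's picture
# Update Dockerfile
# c6a4dcc verified
# raw
# history blame contribute delete
# 369 Bytes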
# Base image: Hugging Face text-generation-inference (TGI) server.
# The tag is pinned instead of ":latest" so rebuilds are reproducible; upgrade
# deliberately with `docker build --build-arg TGI_VERSION=<tag> .`.
# NOTE(review): confirm the pinned tag is the release you want to run.
ARG TGI_VERSION=3.3.4
FROM ghcr.io/huggingface/text-generation-inference:${TGI_VERSION}

# Runtime configuration.
# text-generation-launcher reads MODEL_ID and PORT from the environment, so
# these two variables are the single source of truth for the served model and
# the listen port. They can be overridden at run time (`docker run -e ...` or
# Space variables) without rebuilding the image.
ENV MODEL_ID=meta-llama/Llama-2-7b-chat-hf \
    PORT=7860

# NOTE(review): meta-llama/Llama-2-7b-chat-hf is a gated model; the container
# presumably needs a Hugging Face access token (e.g. HF_TOKEN) injected at run
# time as a secret. Never bake the token into the image with ENV/ARG.

# Document the port the server listens on (HF Spaces default app port).
EXPOSE ${PORT}

# The base image already defines an ENTRYPOINT that runs
# text-generation-launcher, and Docker appends CMD to ENTRYPOINT. CMD must
# therefore hold launcher *arguments* only: repeating the executable name here
# would hand it to the launcher as an unexpected positional argument and the
# container would exit immediately. Model and port come from the ENV above, so
# only the base image's default logging flag is passed.
CMD ["--json-output"]