# Dockerfile for a Hugging Face Space that serves a chat model through the
# text-generation-inference (TGI) server.
#
# Each instruction must sit on its own line: Docker treats everything after a
# leading `#` up to the end of the line as a comment, so a collapsed one-line
# file contains no instructions at all and cannot be built.

# Base image: HF text-generation-inference server.
# NOTE(review): `latest` is a moving tag; consider pinning a specific release
# so rebuilds are reproducible.
FROM ghcr.io/huggingface/text-generation-inference:latest

# Model to serve and the port to listen on. These values are repeated in CMD
# below (exec-form CMD performs no variable expansion), so keep both in sync.
# NOTE(review): this model repository is presumably access-gated on the Hub;
# if so, supply the access token at runtime as a secret, never in this file.
ENV MODEL_ID=meta-llama/Llama-2-7b-chat-hf \
    PORT=7860

# Expose the port for the HF Space.
EXPOSE 7860

# Launch the HF inference server.
# Only the launcher's flags are listed here: the base image is expected to
# define an ENTRYPOINT that already runs `text-generation-launcher`, and an
# exec-form CMD is appended to that ENTRYPOINT as arguments. Repeating the
# binary name would hand it to the launcher as a stray positional argument.
# NOTE(review): confirm the ENTRYPOINT of the image tag actually deployed.
CMD ["--model-id", "meta-llama/Llama-2-7b-chat-hf", "--port", "7860"]