Spaces:
Running
Running
File size: 881 Bytes
bf6b252 dc76031 e7f9ccc dc76031 b723669 dc76031 e7f9ccc |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 |
#!/bin/bash
# Bootstrap script for the app container.
#
# Steps, in order:
#   1. cd into the working directory and create/activate a Python venv.
#   2. Extract the bundled llama.cpp build and download the GGUF model.
#   3. Start llama-server in the background on port 8000.
#   4. Install the Python dependencies and run app.py in the foreground.
#
# Critical steps abort with a message on stderr instead of silently continuing,
# so that app.py is never started without a server binary or a model file.

# Print an error message to stderr and abort the script with status 1.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Set the working directory.
export WORK="/home/user/app"
cd "$WORK" || die "cannot cd to $WORK"

readonly MODEL_URL="https://huggingface.co/Intel/gpt-oss-20b-gguf-q2ks-AutoRound/resolve/main/gpt-oss-20b-32x2.4B-Q2_K_S.gguf"
readonly MODEL_FILE="model.gguf"

# Create the Python virtual environment.
python3 -m venv venv || die "failed to create the virtual environment"

# Activate the virtual environment.
# shellcheck disable=SC1091
source venv/bin/activate || die "failed to activate the virtual environment"

echo "Unzip and download model..."
# -o overwrites existing files without prompting, so a re-run cannot block on
# a prompt that the output redirection would hide. The exit status is not used
# directly; what matters is checked right after.
unzip -o -q llama_cpp_avx512.zip > /dev/null 2>&1
[[ -x ./llama-server ]] \
  || die "llama-server is missing or not executable after extracting llama_cpp_avx512.zip"

# Download to a temporary name and rename only on success, so an interrupted
# transfer never leaves a truncated file under the final model name.
if ! wget -q -O "${MODEL_FILE}.part" "$MODEL_URL"; then
  rm -f -- "${MODEL_FILE}.part"
  die "model download failed: $MODEL_URL"
fi
mv -f -- "${MODEL_FILE}.part" "$MODEL_FILE" || die "cannot move model into place"

echo "Start llama.cpp server..."
./llama-server -m "$MODEL_FILE" \
  --port 8000 \
  --host 0.0.0.0 \
  --threads 2 \
  --ctx-size 4096 \
  --mlock \
  --jinja \
  --temp 0.2 \
  --top-p 0.85 &
server_pid=$!

# Stop the background server when this script exits, so it is not left behind
# once app.py has finished or a later step has aborted.
cleanup() {
  kill "$server_pid" 2> /dev/null
}
trap cleanup EXIT

# Install Python packages into the virtual environment.
# A failed pip self-upgrade is not fatal: the existing pip can still install.
pip install --upgrade pip \
  || printf 'warning: could not upgrade pip, continuing\n' >&2
pip install gradio openai || die "failed to install Python dependencies"

# The server was started before the installs; make sure it has not already
# exited (e.g. because the model could not be loaded) before starting the app.
kill -0 "$server_pid" 2> /dev/null \
  || die "llama-server exited before app.py could start"

echo "Start app.py..."
python app.py
#python3 -m http.server 7860 --bind 0.0.0.0