#!/usr/bin/env bash
#
# Startup script: prepares a Python virtual environment, unpacks the bundled
# llama.cpp build, downloads the GGUF model, launches llama-server in the
# background on port 8000, installs the Python dependencies, and finally runs
# app.py in the foreground.
#
# The script's exit status is that of app.py (or non-zero if any critical
# setup step fails).
set -euo pipefail

# Print an error message to stderr and abort with status 1.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

readonly MODEL_URL="https://huggingface.co/Intel/gpt-oss-20b-gguf-q2ks-AutoRound/resolve/main/gpt-oss-20b-32x2.4B-Q2_K_S.gguf"
readonly MODEL_FILE="model.gguf"

# Set the working directory.
export WORK="/home/user/app"
cd "$WORK" || die "cannot cd to $WORK"

# Create the Python virtual environment.
python3 -m venv venv || die "failed to create virtual environment"

# Activate the virtual environment. Some activate scripts read unset
# variables, so nounset is relaxed just for this step.
set +u
# shellcheck disable=SC1091
source venv/bin/activate
set -u

echo "Unzip and download model..."
# -o: overwrite without prompting (a hidden prompt would hang the script);
# -q: quiet, matching the original's suppressed output.
unzip -o -q llama_cpp_avx512.zip || die "failed to unzip llama_cpp_avx512.zip"

# Download to a temporary name first so an interrupted transfer never leaves
# a truncated file under the name the server loads.
wget -q -O "${MODEL_FILE}.part" "$MODEL_URL" \
  || die "failed to download model from $MODEL_URL"
mv -- "${MODEL_FILE}.part" "$MODEL_FILE"

echo "Start llama.cpp server..."
server_args=(
  -m "$MODEL_FILE"
  --port 8000
  --host 0.0.0.0
  --threads 2
  --ctx-size 4096
  --mlock
  --jinja
  --temp 0.2
  --top-p 0.85
)
# Started in the background so the model loads while pip installs below.
./llama-server "${server_args[@]}" &
server_pid=$!
# Stop the background server on any exit path so it is not left orphaned.
trap 'kill "$server_pid" 2>/dev/null || true' EXIT

# Install Python packages into the virtual environment.
# Upgrading pip itself is best-effort; the package install is mandatory.
pip install --upgrade pip || printf 'warning: pip self-upgrade failed\n' >&2
pip install gradio openai || die "failed to install Python dependencies"

# Catch an early server crash (bad binary, missing model, mlock failure, ...)
# before handing control to the app.
kill -0 "$server_pid" 2>/dev/null || die "llama-server exited during startup"

echo "Start app.py..."
python app.py
# Disabled alternative: serve static files instead of running app.py.
#python3 -m http.server 7860 --bind 0.0.0.0