File size: 881 Bytes
bf6b252
 
dc76031
e7f9ccc
dc76031
 
 
 
 
 
 
 
 
 
b723669
dc76031
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e7f9ccc
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
#!/bin/bash
#
# Start-up script: prepares a Python virtual environment, unpacks the bundled
# llama.cpp build, fetches the GGUF model, launches llama-server in the
# background on port 8000, installs the Python packages and finally runs
# app.py in the foreground.

# Stop on the first unhandled failure. `-u` is intentionally left off because
# the venv activate script may read variables that are unset in a
# non-interactive shell.
set -eo pipefail

# Working directory
export WORK="/home/user/app"
cd "$WORK" || exit 1

readonly LLAMA_ARCHIVE="llama_cpp_avx512.zip"
readonly MODEL_FILE="model.gguf"
readonly MODEL_URL="https://huggingface.co/Intel/gpt-oss-20b-gguf-q2ks-AutoRound/resolve/main/gpt-oss-20b-32x2.4B-Q2_K_S.gguf"

# PID of the background llama-server; empty until the server is launched.
server_pid=""

# Print an error message to stderr and abort the script.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Terminate the background llama-server (if it is still running) so it is not
# left orphaned when this script exits for any reason.
stop_server() {
  if [[ -n "$server_pid" ]] && kill -0 "$server_pid" 2>/dev/null; then
    kill "$server_pid" 2>/dev/null || true
    wait "$server_pid" 2>/dev/null || true
  fi
}
trap stop_server EXIT

# Create the Python virtual environment
python3 -m venv venv

# Activate the virtual environment
# shellcheck disable=SC1091 -- the activate script only exists at runtime
source venv/bin/activate

echo "Unzip and download model..."
# -o overwrites without prompting (safe on re-runs), -q hides the file listing
# but still lets real errors reach stderr. unzip exits with 1 for warnings
# after a successful extraction, so only statuses above 1 are fatal.
unzip_rc=0
unzip -o -q "$LLAMA_ARCHIVE" || unzip_rc=$?
if (( unzip_rc > 1 )); then
  die "failed to extract $LLAMA_ARCHIVE (unzip exit status $unzip_rc)"
fi

# Download to a temporary name and rename on success so that an interrupted
# transfer can never be mistaken for a complete model. An existing non-empty
# model file is reused instead of downloading several gigabytes again.
if [[ ! -s "$MODEL_FILE" ]]; then
  if ! wget -nv -O "$MODEL_FILE.part" "$MODEL_URL"; then
    rm -f -- "$MODEL_FILE.part"
    die "failed to download model from $MODEL_URL"
  fi
  mv -- "$MODEL_FILE.part" "$MODEL_FILE"
fi

[[ -x ./llama-server ]] || die "llama-server not found or not executable in $WORK"

echo "Start llama.cpp server..."
# Launched in the background so the package installation below can proceed
# while the server starts up.
./llama-server -m "$MODEL_FILE" \
  --port 8000 \
  --host 0.0.0.0 \
  --threads 2 \
  --ctx-size 4096 \
  --mlock \
  --jinja \
  --temp 0.2 \
  --top-p 0.85 &
server_pid=$!

# Install the Python packages into the virtual environment.
# Upgrading pip itself is best-effort; the package installation is not.
python -m pip install --upgrade pip \
  || printf 'warning: could not upgrade pip; continuing with the current version\n' >&2
python -m pip install gradio openai || die "failed to install Python packages"

# Fail early with a clear message if the server died while pip was running.
kill -0 "$server_pid" 2>/dev/null || die "llama-server exited during startup"

echo "Start app.py..."
python app.py

#python3 -m http.server 7860 --bind 0.0.0.0