# Spaces: Sleeping  (page-status residue captured with this script; not part of the script itself)
# Launch script: prepares the Python environment, unpacks the llama.cpp build,
# downloads the GGUF model, starts llama-server in the background, and then
# runs app.py in the foreground.
# Requires bash (uses `source` and `[[ ]]`).

# Stop at the first failing command instead of carrying on with a
# half-prepared environment. -u is deliberately left off because it would also
# apply to the sourced venv activate script, which this script does not control.
set -e

# Print an error message to stderr and abort the script.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Set the working directory.
export WORK="/home/user/app"
cd "$WORK" || exit 1

# Create a Python virtual environment (optional).
python3 -m venv venv
# shellcheck source=/dev/null
source venv/bin/activate

# Install Python packages.
pip install --upgrade pip
pip install gradio openai aiohttp

echo "Unzip and download model..."
# -q keeps the output quiet while leaving error messages visible; -o overwrites
# existing files without prompting, so a re-run cannot stall on a
# "replace?" question.
unzip -q -o llama_cpp_avx512.zip || die "failed to unpack llama_cpp_avx512.zip"

# Alternative model (disabled):
#wget -O model.gguf https://huggingface.co/Intel/gpt-oss-20b-gguf-q4ks-AutoRound/resolve/main/gpt-oss-20b-32x2.4B-Q4_K_S.gguf > /dev/null 2>&1
readonly model_url="https://huggingface.co/unsloth/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-Q4_K_M.gguf"

# Download under a temporary name and rename only on success, so a failed or
# interrupted transfer never leaves a truncated model.gguf behind.
if ! wget -q -O model.gguf.part "$model_url"; then
  rm -f model.gguf.part
  die "failed to download model from $model_url"
fi
mv -f model.gguf.part model.gguf

echo "Start llama.cpp server..."
[[ -x ./llama-server ]] || die "llama-server is missing or not executable in $WORK"

# Run the server detached from the terminal; all of its output goes to llama.log.
nohup ./llama-server \
  -m model.gguf \
  --port 8000 \
  --host 0.0.0.0 \
  --threads 2 \
  --ctx-size 16384 \
  --mlock \
  --jinja \
  --temp 0.2 \
  --top-p 0.85 \
  -v \
  > llama.log 2>&1 &
server_pid=$!

# Cheap liveness check: catch an immediate crash (bad flag, unusable binary)
# without waiting for the model to finish loading, so app.py is not held up.
sleep 1
if ! kill -0 "$server_pid" 2>/dev/null; then
  tail -n 50 llama.log >&2 || true
  die "llama-server exited right after launch (see llama.log)"
fi

# Continuously monitor the log without blocking python app.py (disabled).
#tail -n 50 -f llama.log &
#sleep 200

echo "Start app.py..."
python app.py